From 25e1ffaba03798a0886a2b1b2b0058d3b31e46ee Mon Sep 17 00:00:00 2001 From: angelinalg <122562471+angelinalg@users.noreply.github.com> Date: Wed, 25 Jan 2023 22:24:01 -0800 Subject: [PATCH 001/267] [docs] missing parenthesis (#31950) Signed-off-by: angelinalg <122562471+angelinalg@users.noreply.github.com> Signed-off-by: angelinalg <122562471+angelinalg@users.noreply.github.com> --- .../cluster/vms/user-guides/large-cluster-best-practices.rst | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/doc/source/cluster/vms/user-guides/large-cluster-best-practices.rst b/doc/source/cluster/vms/user-guides/large-cluster-best-practices.rst index 49a031bef4df..64287b25254f 100644 --- a/doc/source/cluster/vms/user-guides/large-cluster-best-practices.rst +++ b/doc/source/cluster/vms/user-guides/large-cluster-best-practices.rst @@ -97,8 +97,8 @@ General recommendations with AWS instance types: * The latest gen GPU is almost always the best bang for your buck (p3 > p2, g4 > g3), for most well designed applications the performance outweighs the - price (the instance price may be higher, but you’ll use the instance for less - time. + price. (The instance price may be higher, but you use the instance for less + time.) * You may want to consider using older instances if you’re doing dev work and won’t actually fully utilize the GPUs though. * If you’re doing training (ML or RL), you should use a P instance. If you’re From 1f3226ef866d1625c1d6d43ac553798dfbd941f5 Mon Sep 17 00:00:00 2001 From: Yi Cheng <74173148+iycheng@users.noreply.github.com> Date: Wed, 25 Jan 2023 22:56:49 -0800 Subject: [PATCH 002/267] [core][scalability] Change ray syncer from unary call to streaming call (#30460) With unary calls it is hard to make resource broadcasting fault tolerant, because the broadcast status needs to be maintained across calls. This PR changes the communication protocol to a streaming call. The protocol changes in a few ways: once a message is received it is pushed immediately, but the write is buffered (512 KB) so the cost stays small; when there are no more messages to send, or the buffer is exceeded, the stream is flushed. The PR has been tested with 2k nodes (2 CPUs per node) and 14k actors.
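The buffering described above maps onto gRPC's per-write buffer hint: each queued message is written with set_buffer_hint() so gRPC may coalesce it, the last queued message is written with clear_buffer_hint() to force a flush, and the new grpc_stream_buffer_size config (512 * 1024) added in ray_config_def.h sizes the stream buffer on the gRPC side. Below is a condensed sketch of that send path, adapted from RaySyncerBidiReactorBase in this diff; member names come from the diff, and error handling plus the deduplicating sending_buffer_ map are simplified away.

    // Condensed from RaySyncerBidiReactorBase::StartSend()/Send()/OnWriteDone().
    // At most one StartWrite() is outstanding; only the last queued message
    // asks gRPC to flush, earlier writes stay in gRPC's stream buffer.
    void StartSend() {
      if (sending_ || sending_buffer_.empty()) {
        return;  // A write is already in flight, or nothing is queued.
      }
      auto iter = sending_buffer_.begin();
      sending_message_ = std::move(iter->second);
      sending_buffer_.erase(iter);

      grpc::WriteOptions opts;
      if (sending_buffer_.empty()) {
        opts.clear_buffer_hint();  // Last queued message: flush the stream.
      } else {
        opts.set_buffer_hint();    // More queued: let gRPC buffer this write.
      }
      StartWrite(sending_message_.get(), opts);
      sending_ = true;
    }

    void OnWriteDone(bool ok) override {
      if (ok) {
        // The previous write completed; send the next queued message, if any.
        io_context_.dispatch([this]() { sending_ = false; StartSend(); }, "");
      }
    }

This buffered bidi stream is what replaces the Update and LongPolling unary RPCs removed further down in the diff.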
--- BUILD.bazel | 1 + .../many_nodes_tests/actor_test.py | 15 +- src/mock/ray/common/ray_syncer/ray_syncer.h | 20 +- src/ray/common/id.cc | 3 + src/ray/common/id.h | 4 + src/ray/common/ray_config_def.h | 4 + src/ray/common/ray_syncer/ray_syncer-inl.h | 313 +++++++++--- src/ray/common/ray_syncer/ray_syncer.cc | 478 +++++++----------- src/ray/common/ray_syncer/ray_syncer.h | 87 +--- src/ray/common/test/ray_syncer_test.cc | 388 ++++++++++---- .../common/test/syncer_service_e2e_test.cc | 2 +- src/ray/gcs/gcs_server/gcs_actor_scheduler.cc | 1 - src/ray/gcs/gcs_server/gcs_server.cc | 38 +- src/ray/gcs/gcs_server/gcs_server.h | 4 +- src/ray/protobuf/ray_syncer.proto | 33 +- src/ray/raylet/node_manager.cc | 2 + src/ray/rpc/grpc_client.h | 3 +- src/ray/rpc/grpc_server.cc | 3 +- 18 files changed, 811 insertions(+), 588 deletions(-) diff --git a/BUILD.bazel b/BUILD.bazel index 88088be4788d..82e9a74be901 100644 --- a/BUILD.bazel +++ b/BUILD.bazel @@ -2631,6 +2631,7 @@ cc_test( copts = COPTS, tags = ["team:core"], deps = [ + ":grpc_common_lib", ":ray_common", ":ray_mock", "@com_google_googletest//:gtest", diff --git a/release/nightly_tests/many_nodes_tests/actor_test.py b/release/nightly_tests/many_nodes_tests/actor_test.py index 620db9cefbd8..884647d1c0f3 100644 --- a/release/nightly_tests/many_nodes_tests/actor_test.py +++ b/release/nightly_tests/many_nodes_tests/actor_test.py @@ -16,11 +16,6 @@ def foo(self): return actors -def test_actor_ready(actors): - remaining = [actor.foo.remote() for actor in actors] - ray.get(remaining) - - def parse_script_args(): parser = argparse.ArgumentParser() parser.add_argument("--cpus-per-actor", type=float, default=0.2) @@ -43,7 +38,15 @@ def main(): sleep(10) return actor_ready_start = perf_counter() - test_actor_ready(actors) + total_actors = len(actors) + objs = [actor.foo.remote() for actor in actors] + + while len(objs) != 0: + objs_ready, objs = ray.wait(objs, timeout=10) + print( + f"Status: {total_actors - len(objs)}/{total_actors}, " + f"{perf_counter() - actor_ready_start}" + ) actor_ready_end = perf_counter() actor_ready_time = actor_ready_end - actor_ready_start diff --git a/src/mock/ray/common/ray_syncer/ray_syncer.h b/src/mock/ray/common/ray_syncer/ray_syncer.h index 0f768dab64c3..2ef430420697 100644 --- a/src/mock/ray/common/ray_syncer/ray_syncer.h +++ b/src/mock/ray/common/ray_syncer/ray_syncer.h @@ -43,10 +43,24 @@ class MockReceiverInterface : public ReceiverInterface { namespace ray { namespace syncer { -class MockNodeSyncConnection : public NodeSyncConnection { +class MockRaySyncerBidiReactor : public RaySyncerBidiReactor { public: - using NodeSyncConnection::NodeSyncConnection; - MOCK_METHOD(void, DoSend, (), (override)); + using RaySyncerBidiReactor::RaySyncerBidiReactor; + + MOCK_METHOD(void, Disconnect, (), (override)); + + MOCK_METHOD(bool, + PushToSendingQueue, + (std::shared_ptr), + (override)); +}; + +template +class MockRaySyncerBidiReactorBase : public RaySyncerBidiReactorBase { + public: + using RaySyncerBidiReactorBase::RaySyncerBidiReactorBase; + + MOCK_METHOD(void, Disconnect, (), (override)); }; } // namespace syncer diff --git a/src/ray/common/id.cc b/src/ray/common/id.cc index a7c51ccce55a..444770769568 100644 --- a/src/ray/common/id.cc +++ b/src/ray/common/id.cc @@ -337,4 +337,7 @@ ID_OSTREAM_OPERATOR(ActorID); ID_OSTREAM_OPERATOR(TaskID); ID_OSTREAM_OPERATOR(ObjectID); ID_OSTREAM_OPERATOR(PlacementGroupID); + +const NodeID kGCSNodeID = NodeID::FromBinary(std::string(kUniqueIDSize, 0)); + } // namespace ray diff --git 
a/src/ray/common/id.h b/src/ray/common/id.h index efe6c8ed9774..a6c753a1de35 100644 --- a/src/ray/common/id.h +++ b/src/ray/common/id.h @@ -561,3 +561,7 @@ DEFINE_UNIQUE_ID(PlacementGroupID); #undef DEFINE_UNIQUE_ID } // namespace std + +namespace ray { +extern const NodeID kGCSNodeID; +} diff --git a/src/ray/common/ray_config_def.h b/src/ray/common/ray_config_def.h index fd01f2bb0471..eb93e48f520d 100644 --- a/src/ray/common/ray_config_def.h +++ b/src/ray/common/ray_config_def.h @@ -686,6 +686,10 @@ RAY_CONFIG(int64_t, grpc_client_keepalive_time_ms, 300000) /// grpc keepalive timeout for client. RAY_CONFIG(int64_t, grpc_client_keepalive_timeout_ms, 120000) +/// grpc streaming buffer size +/// Set it to 512kb +RAY_CONFIG(int64_t, grpc_stream_buffer_size, 512 * 1024); + /// Whether to use log reporter in event framework RAY_CONFIG(bool, event_log_reporter_enabled, false) diff --git a/src/ray/common/ray_syncer/ray_syncer-inl.h b/src/ray/common/ray_syncer/ray_syncer-inl.h index 506ab14b6d9f..7726bc3da654 100644 --- a/src/ray/common/ray_syncer/ray_syncer-inl.h +++ b/src/ray/common/ray_syncer/ray_syncer-inl.h @@ -79,12 +79,48 @@ class NodeState { cluster_view_; }; -class NodeSyncConnection { +/// This is the base class for the bidi-streaming call and defined the method +/// needed. A bidi-stream for ray syncer needs to support pushing message and +/// disconnect from the remote node. +/// For the implementation, in the constructor, it needs to connect to the remote +/// node and it needs to implement the communication between the two nodes. +/// +/// Please refer to https://github.com/grpc/proposal/blob/master/L67-cpp-callback-api.md +/// for the callback API +/// +// clang-format off +/// For the server side: +/// grpc end (error or request) +/// +---------------------------------------------------------------+ +/// | v +/// +------------+ +-------------+ canceled by client +----------+ +--------+ +--------+ +/// | StartRead | <--> | OnReadDone | -----------------------------> | OnCancel | --> | Finish | --> | OnDone | +/// +------------+ +-------------+ +----------+ +--------+ +--------+ +/// canceled by client ^ ^ +/// +----------------------------------------------+ | +/// | | +/// +------------+ +-------------+ grpc end (error or request) | +/// | StartWrite | <--> | OnWriteDone | --------------------------------------------------+ +/// +------------+ +-------------+ +/// +/// +/// For the client side: +/// +------------+ +-------------+ +------------+ gRPC error or disconnected +--------+ +/// | StartCall | ---> | StartRead | <---> | OnReadDone | ----------------------------> | OnDone | +/// +------------+ +-------------+ +------------+ +--------+ +/// | ^ +/// | | +/// v | +/// +------------+ +-------------+ gRPC error or disconnected | +/// | StartWrite | <--> | OnWriteDone | -------------------------------------------------------+ +/// +------------+ +-------------+ +// clang-format on +class RaySyncerBidiReactor { public: - NodeSyncConnection( - instrumented_io_context &io_context, - std::string remote_node_id, - std::function)> message_processor); + RaySyncerBidiReactor(const std::string &remote_node_id) + : remote_node_id_(remote_node_id) {} + + virtual ~RaySyncerBidiReactor(){}; /// Push a message to the sending queue to be sent later. Some message /// might be dropped if the module think the target node has already got the @@ -94,38 +130,192 @@ class NodeSyncConnection { /// \param message The message to be sent. /// /// \return true if push to queue successfully. 
- bool PushToSendingQueue(std::shared_ptr message); - - /// Send the message queued. - virtual void DoSend() = 0; - - virtual ~NodeSyncConnection() {} + virtual bool PushToSendingQueue(std::shared_ptr message) = 0; /// Return the remote node id of this connection. const std::string &GetRemoteNodeID() const { return remote_node_id_; } + /// Disconnect will terminate the communication between local and remote node. + /// It also needs to do proper cleanup. + virtual void Disconnect() = 0; + + private: + std::string remote_node_id_; +}; + +/// This class implements the communication between two nodes except the initialization +/// and cleanup. +/// It keeps track of the message received and sent between two nodes and uses that to +/// deduplicate the messages. It also supports the batching for performance purposes. +template +class RaySyncerBidiReactorBase : public RaySyncerBidiReactor, public T { + public: + /// Constructor of RaySyncerBidiReactor. + /// + /// \param io_context The io context for the callback. + /// \param remote_node_id The node id connects to. + /// \param message_processor The callback for the message received. + /// \param cleanup_cb When the connection terminates, it'll be called to cleanup + /// the environment. + RaySyncerBidiReactorBase( + instrumented_io_context &io_context, + const std::string &remote_node_id, + std::function)> message_processor) + : RaySyncerBidiReactor(remote_node_id), + io_context_(io_context), + message_processor_(std::move(message_processor)) {} + + bool PushToSendingQueue(std::shared_ptr message) override { + // Try to filter out the messages the target node already has. + // Usually it'll be the case when the message is generated from the + // target node or it's sent from the target node. + // No need to resend the message sent from a node back. + if (message->node_id() == GetRemoteNodeID()) { + // Skip the message when it's about the node of this connection. + return false; + } + + auto &node_versions = GetNodeComponentVersions(message->node_id()); + if (node_versions[message->message_type()] < message->version()) { + node_versions[message->message_type()] = message->version(); + sending_buffer_[std::make_pair(message->node_id(), message->message_type())] = + std::move(message); + StartSend(); + return true; + } + return false; + } + + virtual ~RaySyncerBidiReactorBase() {} + + void StartPull() { + receiving_message_ = std::make_shared(); + RAY_LOG(DEBUG) << "Start reading: " << NodeID::FromBinary(GetRemoteNodeID()); + StartRead(receiving_message_.get()); + } + + protected: + /// The io context + instrumented_io_context &io_context_; + + private: /// Handle the udpates sent from the remote node. /// /// \param messages The message received. - void ReceiveUpdate(RaySyncMessages messages); + void ReceiveUpdate(std::shared_ptr message) { + auto &node_versions = GetNodeComponentVersions(message->node_id()); + RAY_LOG(DEBUG) << "Receive update: " + << " message_type=" << message->message_type() + << ", message_version=" << message->version() + << ", local_message_version=" + << node_versions[message->message_type()]; + if (node_versions[message->message_type()] < message->version()) { + node_versions[message->message_type()] = message->version(); + message_processor_(message); + } else { + RAY_LOG_EVERY_N(WARNING, 100) + << "Drop message received from " << NodeID::FromBinary(message->node_id()) + << " because the message version " << message->version() + << " is older than the local version " << node_versions[message->message_type()] + << ". 
Message type: " << message->message_type(); + } + } + + void SendNext() { + sending_ = false; + StartSend(); + } + + void StartSend() { + if (sending_) { + return; + } + + if (sending_buffer_.size() != 0) { + auto iter = sending_buffer_.begin(); + auto msg = std::move(iter->second); + sending_buffer_.erase(iter); + Send(std::move(msg), sending_buffer_.empty()); + sending_ = true; + } + } + + /// Sending a message to the remote node + /// + /// \param message The message to be sent + /// \param flush Whether to flush the sending queue in gRPC. + void Send(std::shared_ptr message, bool flush) { + sending_message_ = std::move(message); + grpc::WriteOptions opts; + if (flush) { + opts.clear_buffer_hint(); + } else { + opts.set_buffer_hint(); + } + RAY_LOG(DEBUG) << "[BidiReactor] Sending message to " + << NodeID::FromBinary(GetRemoteNodeID()) << " about node " + << NodeID::FromBinary(sending_message_->node_id()); + StartWrite(sending_message_.get(), opts); + } + + // Please refer to grpc callback api for the following four methods: + // https://github.com/grpc/proposal/blob/master/L67-cpp-callback-api.md + using T::StartRead; + using T::StartWrite; + + void OnWriteDone(bool ok) override { + if (ok) { + io_context_.dispatch([this]() { SendNext(); }, ""); + } else { + // No need to resent the message since if ok=false, it's the end + // of gRPC call and client will reconnect in case of a failure. + // In gRPC, OnDone will be called after. + RAY_LOG_EVERY_N(ERROR, 100) + << "Failed to send the message to: " << NodeID::FromBinary(GetRemoteNodeID()); + } + } + + void OnReadDone(bool ok) override { + if (ok) { + io_context_.dispatch( + [this, msg = std::move(receiving_message_)]() mutable { + RAY_CHECK(!msg->node_id().empty()); + ReceiveUpdate(std::move(msg)); + StartPull(); + }, + ""); + } else { + // No need to resent the message since if ok=false, it's the end + // of gRPC call and client will reconnect in case of a failure. + // In gRPC, OnDone will be called after. + RAY_LOG_EVERY_N(ERROR, 100) + << "Failed to read the message from: " << NodeID::FromBinary(GetRemoteNodeID()); + } + } + + /// grpc requests for sending and receiving + std::shared_ptr sending_message_; + std::shared_ptr receiving_message_; - protected: // For testing - FRIEND_TEST(RaySyncerTest, NodeSyncConnection); + FRIEND_TEST(RaySyncerTest, RaySyncerBidiReactorBase); friend struct SyncerServerTest; std::array &GetNodeComponentVersions( - const std::string &node_id); - - /// The io context - instrumented_io_context &io_context_; - - /// The remote node id. - std::string remote_node_id_; + const std::string &node_id) { + auto iter = node_versions_.find(node_id); + if (iter == node_versions_.end()) { + iter = node_versions_.emplace(node_id, std::array()) + .first; + iter->second.fill(-1); + } + return iter->second; + } /// Handler of a message update. - std::function)> message_processor_; + const std::function)> message_processor_; + private: /// Buffering all the updates. Sending will be done in an async way. absl::flat_hash_map, std::shared_ptr> @@ -136,58 +326,63 @@ class NodeSyncConnection { /// We'll filter the received or sent messages when the message is stale. absl::flat_hash_map> node_versions_; + + bool sending_ = false; }; -/// SyncConnection for gRPC server side. It has customized logic for sending. -class ServerSyncConnection : public NodeSyncConnection { +/// Reactor for gRPC server side. It defines the server's specific behavior for a +/// streaming call. 
+class RayServerBidiReactor : public RaySyncerBidiReactorBase { public: - ServerSyncConnection( + RayServerBidiReactor( + grpc::CallbackServerContext *server_context, instrumented_io_context &io_context, - const std::string &remote_node_id, - std::function)> message_processor); + const std::string &local_node_id, + std::function)> message_processor, + std::function cleanup_cb); - ~ServerSyncConnection() override; + ~RayServerBidiReactor() override = default; - void HandleLongPollingRequest(grpc::ServerUnaryReactor *reactor, - RaySyncMessages *response); + void Disconnect() override; - protected: - /// Send the message from the pending queue to the target node. - /// It'll send nothing unless there is a long-polling request. - /// TODO (iycheng): Unify the sending algorithm when we migrate to gRPC streaming - void DoSend() override; - - /// These two fields are RPC related. When the server got long-polling requests, - /// these two fields will be set so that it can be used to send message. - /// After the message being sent, these two fields will be set to be empty again. - /// When the periodical timer wake up, it'll check whether these two fields are set - /// and it'll only send data when these are set. - std::vector responses_; - std::vector unary_reactors_; + private: + void OnCancel() override; + void OnDone() override; + + /// Cleanup callback when the call ends. + const std::function cleanup_cb_; + + /// grpc callback context + grpc::CallbackServerContext *server_context_; }; -/// SyncConnection for gRPC client side. It has customized logic for sending. -class ClientSyncConnection : public NodeSyncConnection { +/// Reactor for gRPC client side. It defines the client's specific behavior for a +/// streaming call. +class RayClientBidiReactor : public RaySyncerBidiReactorBase { public: - ClientSyncConnection( + RayClientBidiReactor( + const std::string &remote_node_id, + const std::string &local_node_id, instrumented_io_context &io_context, - const std::string &node_id, - std::function)> message_processor, - std::shared_ptr channel); + std::function)> message_processor, + std::function cleanup_cb, + std::unique_ptr stub); - protected: - /// Send the message from the pending queue to the target node. - /// It'll use gRPC to send the message directly. - void DoSend() override; + ~RayClientBidiReactor() override = default; - /// Start to send long-polling request to remote nodes. - void StartLongPolling(); + void Disconnect() override; - /// Stub for this connection. - std::unique_ptr stub_; + private: + /// Callback from gRPC + void OnDone(const grpc::Status &status) override; - /// Dummy request for long-polling. - DummyRequest dummy_; + /// Cleanup callback when the call ends. + const std::function cleanup_cb_; + + /// grpc callback context + grpc::ClientContext client_context_; + + std::unique_ptr stub_; }; } // namespace syncer diff --git a/src/ray/common/ray_syncer/ray_syncer.cc b/src/ray/common/ray_syncer/ray_syncer.cc index 86afc1625146..7dd8420e78a9 100644 --- a/src/ray/common/ray_syncer/ray_syncer.cc +++ b/src/ray/common/ray_syncer/ray_syncer.cc @@ -55,9 +55,10 @@ std::optional NodeState::CreateSyncMessage(MessageType message_t bool NodeState::ConsumeSyncMessage(std::shared_ptr message) { auto ¤t = cluster_view_[message->node_id()][message->message_type()]; - RAY_LOG(DEBUG) << "ConsumeSyncMessage: " << (current ? 
current->version() : -1) - << " message_version: " << message->version() - << ", message_from: " << NodeID::FromBinary(message->node_id()); + RAY_LOG(DEBUG) << "ConsumeSyncMessage: local_version=" + << (current ? current->version() : -1) + << " message_version=" << message->version() + << ", message_from=" << NodeID::FromBinary(message->node_id()); // Check whether newer version of this message has been received. if (current && current->version() >= message->version()) { return false; @@ -66,180 +67,85 @@ bool NodeState::ConsumeSyncMessage(std::shared_ptr message current = message; auto receiver = receivers_[message->message_type()]; if (receiver != nullptr) { + RAY_LOG(DEBUG) << "Consume message from: " << NodeID::FromBinary(message->node_id()); receiver->ConsumeSyncMessage(message); } return true; } -NodeSyncConnection::NodeSyncConnection( - instrumented_io_context &io_context, - std::string remote_node_id, - std::function)> message_processor) - : io_context_(io_context), - remote_node_id_(std::move(remote_node_id)), - message_processor_(std::move(message_processor)) {} - -void NodeSyncConnection::ReceiveUpdate(RaySyncMessages messages) { - for (auto &message : *messages.mutable_sync_messages()) { - auto &node_versions = GetNodeComponentVersions(message.node_id()); - RAY_LOG(DEBUG) << "Receive update: " - << " message_type=" << message.message_type() - << ", message_version=" << message.version() - << ", local_message_version=" << node_versions[message.message_type()]; - if (node_versions[message.message_type()] < message.version()) { - node_versions[message.message_type()] = message.version(); - message_processor_(std::make_shared(std::move(message))); - } - } -} +namespace { -bool NodeSyncConnection::PushToSendingQueue( - std::shared_ptr message) { - // Try to filter out the messages the target node already has. - // Usually it'll be the case when the message is generated from the - // target node or it's sent from the target node. - if (message->node_id() == GetRemoteNodeID()) { - // Skip the message when it's about the node of this connection. 
- return false; - } - - auto &node_versions = GetNodeComponentVersions(message->node_id()); - if (node_versions[message->message_type()] < message->version()) { - node_versions[message->message_type()] = message->version(); - sending_buffer_[std::make_pair(message->node_id(), message->message_type())] = - message; - return true; - } - return false; +std::string GetNodeIDFromServerContext(grpc::CallbackServerContext *server_context) { + const auto &metadata = server_context->client_metadata(); + auto iter = metadata.find("node_id"); + RAY_CHECK(iter != metadata.end()); + return NodeID::FromHex(std::string(iter->second.begin(), iter->second.end())).Binary(); } -std::array &NodeSyncConnection::GetNodeComponentVersions( - const std::string &node_id) { - auto iter = node_versions_.find(node_id); - if (iter == node_versions_.end()) { - iter = - node_versions_.emplace(node_id, std::array()).first; - iter->second.fill(-1); - } - return iter->second; -} +} // namespace -ClientSyncConnection::ClientSyncConnection( +RayServerBidiReactor::RayServerBidiReactor( + grpc::CallbackServerContext *server_context, instrumented_io_context &io_context, - const std::string &node_id, - std::function)> message_processor, - std::shared_ptr channel) - : NodeSyncConnection(io_context, node_id, std::move(message_processor)), - stub_(ray::rpc::syncer::RaySyncer::NewStub(channel)) { - for (int64_t i = 0; i < RayConfig::instance().ray_syncer_polling_buffer(); ++i) { - StartLongPolling(); - } + const std::string &local_node_id, + std::function)> message_processor, + std::function cleanup_cb) + : RaySyncerBidiReactorBase( + io_context, + GetNodeIDFromServerContext(server_context), + std::move(message_processor)), + cleanup_cb_(std::move(cleanup_cb)), + server_context_(server_context) { + // Send the local node id to the remote + server_context_->AddInitialMetadata("node_id", NodeID::FromBinary(local_node_id).Hex()); + StartSendInitialMetadata(); + + // Start pulling from remote + StartPull(); } -void ClientSyncConnection::StartLongPolling() { - // This will be a long-polling request. The node will only reply if - // 1. there is a new version of message - // 2. and it has passed X ms since last update. - auto client_context = std::make_shared(); - auto in_message = std::make_shared(); - stub_->async()->LongPolling( - client_context.get(), - &dummy_, - in_message.get(), - [this, client_context, in_message](grpc::Status status) mutable { - if (status.ok()) { - io_context_.dispatch( - [this, messages = std::move(*in_message)]() mutable { - ReceiveUpdate(std::move(messages)); - }, - "LongPollingCallback"); - // Start the next polling. 
- StartLongPolling(); - } - }); +void RayServerBidiReactor::Disconnect() { + io_context_.dispatch([this]() { Finish(grpc::Status::OK); }, ""); } -void ClientSyncConnection::DoSend() { - if (sending_buffer_.empty()) { - return; - } +void RayServerBidiReactor::OnCancel() { Disconnect(); } - auto client_context = std::make_shared(); - auto arena = std::make_shared(); - auto request = google::protobuf::Arena::CreateMessage(arena.get()); - auto response = google::protobuf::Arena::CreateMessage(arena.get()); - - std::vector> holder; - - size_t message_bytes = 0; - auto iter = sending_buffer_.begin(); - while (message_bytes < RayConfig::instance().max_sync_message_batch_bytes() && - iter != sending_buffer_.end()) { - message_bytes += iter->second->sync_message().size(); - // TODO (iycheng): Use arena allocator for optimization - request->mutable_sync_messages()->UnsafeArenaAddAllocated( - const_cast(iter->second.get())); - holder.push_back(iter->second); - sending_buffer_.erase(iter++); - } - if (request->sync_messages_size() != 0) { - stub_->async()->Update( - client_context.get(), - request, - response, - [arena, client_context, holder = std::move(holder)](grpc::Status status) { - if (!status.ok()) { - RAY_LOG(ERROR) << "Sending request failed because of " - << status.error_message(); - } - }); - } +void RayServerBidiReactor::OnDone() { + io_context_.dispatch( + [this]() { + cleanup_cb_(GetRemoteNodeID(), false); + delete this; + }, + ""); } -ServerSyncConnection::ServerSyncConnection( - instrumented_io_context &io_context, +RayClientBidiReactor::RayClientBidiReactor( const std::string &remote_node_id, - std::function)> message_processor) - : NodeSyncConnection(io_context, remote_node_id, std::move(message_processor)) {} - -ServerSyncConnection::~ServerSyncConnection() { - // If there is a pending request, we need to cancel it. Otherwise, rpc will - // hang there forever. 
- while (!unary_reactors_.empty()) { - unary_reactors_.back()->Finish(grpc::Status::CANCELLED); - unary_reactors_.pop_back(); - } + const std::string &local_node_id, + instrumented_io_context &io_context, + std::function)> message_processor, + std::function cleanup_cb, + std::unique_ptr stub) + : RaySyncerBidiReactorBase( + io_context, remote_node_id, std::move(message_processor)), + cleanup_cb_(std::move(cleanup_cb)), + stub_(std::move(stub)) { + client_context_.AddMetadata("node_id", NodeID::FromBinary(local_node_id).Hex()); + stub_->async()->StartSync(&client_context_, this); + StartPull(); } -void ServerSyncConnection::HandleLongPollingRequest(grpc::ServerUnaryReactor *reactor, - RaySyncMessages *response) { - unary_reactors_.push_back(reactor); - responses_.push_back(response); +void RayClientBidiReactor::OnDone(const grpc::Status &status) { + io_context_.dispatch( + [this, status]() { + cleanup_cb_(GetRemoteNodeID(), !status.ok()); + delete this; + }, + ""); } -void ServerSyncConnection::DoSend() { - // There is no receive request - if (unary_reactors_.empty() || sending_buffer_.empty()) { - return; - } - - RAY_CHECK(!responses_.empty()); - - size_t message_bytes = 0; - auto iter = sending_buffer_.begin(); - while (message_bytes < RayConfig::instance().max_sync_message_batch_bytes() && - iter != sending_buffer_.end()) { - message_bytes += iter->second->sync_message().size(); - // TODO (iycheng): Use arena allocator for optimization - responses_.back()->add_sync_messages()->CopyFrom(*iter->second); - sending_buffer_.erase(iter++); - } - - if (responses_.back()->sync_messages_size() != 0) { - unary_reactors_.back()->Finish(grpc::Status::OK); - responses_.pop_back(); - unary_reactors_.pop_back(); - } +void RayClientBidiReactor::Disconnect() { + io_context_.dispatch([this]() { StartWritesDone(); }, ""); } RaySyncer::RaySyncer(instrumented_io_context &io_context, @@ -249,109 +155,133 @@ RaySyncer::RaySyncer(instrumented_io_context &io_context, node_state_(std::make_unique()), timer_(io_context) { stopped_ = std::make_shared(false); - timer_.RunFnPeriodically( - [this]() { - for (auto &[_, sync_connection] : sync_connections_) { - sync_connection->DoSend(); - } - }, - RayConfig::instance().raylet_report_resources_period_milliseconds()); } RaySyncer::~RaySyncer() { *stopped_ = true; - for (auto &call : inflight_requests_) { - auto f = call->promise.get_future(); - if (!f.valid()) { - call->context.TryCancel(); - } - f.get(); - } + io_context_.dispatch( + [reactors = sync_reactors_]() { + for (auto [_, reactor] : reactors) { + reactor->Disconnect(); + } + }, + ""); } -void RaySyncer::Connect(std::shared_ptr channel) { - auto call = std::make_unique(); - - auto stub = ray::rpc::syncer::RaySyncer::NewStub(channel); - call->request.set_node_id(local_node_id_); - - stub->async()->StartSync( - &call->context, - &call->request, - &call->response, - [this, channel, call = call.get(), stopped = this->stopped_](grpc::Status status) { - call->promise.set_value(); - if (*stopped) { - return; - } - if (status.ok()) { - io_context_.dispatch( - [this, channel, node_id = call->response.node_id()]() { - auto connection = std::make_unique( - io_context_, - node_id, - [this](auto msg) { BroadcastMessage(msg); }, - channel); - Connect(std::move(connection)); - }, - "StartSyncCallback"); +std::vector RaySyncer::GetAllConnectedNodeIDs() const { + std::promise> promise; + io_context_.dispatch( + [&]() { + std::vector nodes; + for (auto [node_id, _] : sync_reactors_) { + nodes.push_back(node_id); } - }); - 
inflight_requests_.emplace(std::move(call)); + promise.set_value(std::move(nodes)); + }, + ""); + return promise.get_future().get(); +} + +void RaySyncer::Connect(const std::string &node_id, + std::shared_ptr channel) { + io_context_.dispatch( + [=]() { + auto stub = ray::rpc::syncer::RaySyncer::NewStub(channel); + auto reactor = new RayClientBidiReactor( + /* remote_node_id */ node_id, + /* local_node_id */ GetLocalNodeID(), + /* io_context */ io_context_, + /* message_processor */ [this](auto msg) { BroadcastRaySyncMessage(msg); }, + /* cleanup_cb */ + [this, channel](const std::string &node_id, bool restart) { + sync_reactors_.erase(node_id); + if (restart) { + RAY_LOG(INFO) << "Connection is broken. Reconnect to node: " + << NodeID::FromBinary(node_id); + Connect(node_id, channel); + } + }, + /* stub */ std::move(stub)); + Connect(reactor); + reactor->StartCall(); + }, + ""); } -void RaySyncer::Connect(std::unique_ptr connection) { - // Somehow connection=std::move(connection) won't be compiled here. - // Potentially it might have a leak here if the function is not executed. +void RaySyncer::Connect(RaySyncerBidiReactor *reactor) { io_context_.dispatch( - [this, connection = connection.release()]() mutable { - RAY_CHECK(connection != nullptr); - RAY_CHECK(sync_connections_[connection->GetRemoteNodeID()] == nullptr); - auto &conn = *connection; - sync_connections_[connection->GetRemoteNodeID()].reset(connection); + [this, reactor]() { + RAY_CHECK(sync_reactors_.find(reactor->GetRemoteNodeID()) == + sync_reactors_.end()); + sync_reactors_[reactor->GetRemoteNodeID()] = reactor; + // Send the view for new connections. for (const auto &[_, messages] : node_state_->GetClusterView()) { - for (auto &message : messages) { + for (const auto &message : messages) { if (!message) { continue; } - conn.PushToSendingQueue(message); + RAY_LOG(DEBUG) << "Push init view from: " + << NodeID::FromBinary(GetLocalNodeID()) << " to " + << NodeID::FromBinary(reactor->GetRemoteNodeID()) << " about " + << NodeID::FromBinary(message->node_id()); + reactor->PushToSendingQueue(message); } } }, - "RaySyncer::Connect"); + "RaySyncerConnect"); } void RaySyncer::Disconnect(const std::string &node_id) { + std::promise promise; io_context_.dispatch( - [this, node_id]() { - auto iter = sync_connections_.find(node_id); - if (iter != sync_connections_.end()) { - sync_connections_.erase(iter); + [&]() { + auto iter = sync_reactors_.find(node_id); + if (iter == sync_reactors_.end()) { + promise.set_value(nullptr); + return; + } + + auto reactor = iter->second; + if (iter != sync_reactors_.end()) { + sync_reactors_.erase(iter); } + promise.set_value(reactor); }, "RaySyncerDisconnect"); + auto reactor = promise.get_future().get(); + if (reactor != nullptr) { + reactor->Disconnect(); + } } -bool RaySyncer::Register(MessageType message_type, +void RaySyncer::Register(MessageType message_type, const ReporterInterface *reporter, ReceiverInterface *receiver, int64_t pull_from_reporter_interval_ms) { - if (!node_state_->SetComponent(message_type, reporter, receiver)) { - return false; - } + io_context_.dispatch( + [this, message_type, reporter, receiver, pull_from_reporter_interval_ms]() mutable { + if (!node_state_->SetComponent(message_type, reporter, receiver)) { + return; + } - // Set job to pull from reporter periodically - if (reporter != nullptr && pull_from_reporter_interval_ms > 0) { - timer_.RunFnPeriodically( - [this, message_type]() { OnDemandBroadcasting(message_type); }, - pull_from_reporter_interval_ms); - } + // Set 
job to pull from reporter periodically + if (reporter != nullptr && pull_from_reporter_interval_ms > 0) { + timer_.RunFnPeriodically( + [this, stopped = stopped_, message_type]() { + if (*stopped) { + return; + } + OnDemandBroadcasting(message_type); + }, + pull_from_reporter_interval_ms); + } - RAY_LOG(DEBUG) << "Registered components: " - << "message_type:" << message_type << ", reporter:" << reporter - << ", receiver:" << receiver - << ", pull_from_reporter_interval_ms:" << pull_from_reporter_interval_ms; - return true; + RAY_LOG(DEBUG) << "Registered components: " + << "message_type:" << message_type << ", reporter:" << reporter + << ", receiver:" << receiver << ", pull_from_reporter_interval_ms:" + << pull_from_reporter_interval_ms; + }, + "RaySyncerRegister"); } bool RaySyncer::OnDemandBroadcasting(MessageType message_type) { @@ -372,90 +302,38 @@ void RaySyncer::BroadcastMessage(std::shared_ptr message) io_context_.dispatch( [this, message] { // The message is stale. Just skip this one. + RAY_LOG(DEBUG) << "Receive message from: " + << NodeID::FromBinary(message->node_id()) << " to " + << NodeID::FromBinary(GetLocalNodeID()); if (!node_state_->ConsumeSyncMessage(message)) { return; } - for (auto &connection : sync_connections_) { - connection.second->PushToSendingQueue(message); + for (auto &reactor : sync_reactors_) { + reactor.second->PushToSendingQueue(message); } }, "RaySyncer.BroadcastMessage"); } -grpc::ServerUnaryReactor *RaySyncerService::StartSync( - grpc::CallbackServerContext *context, - const StartSyncRequest *request, - StartSyncResponse *response) { - auto *reactor = context->DefaultReactor(); - // Make sure server only have one client - if (!remote_node_id_.empty()) { - RAY_LOG(WARNING) << "Get a new sync request from " - << NodeID::FromBinary(request->node_id()) << ". " - << "Now disconnect from " << NodeID::FromBinary(remote_node_id_); - syncer_.Disconnect(remote_node_id_); - } - remote_node_id_ = request->node_id(); - RAY_LOG(DEBUG) << "Get connect from: " << NodeID::FromBinary(remote_node_id_); - syncer_.GetIOContext().dispatch( - [this, response, reactor, context]() { - if (context->IsCancelled()) { - reactor->Finish(grpc::Status::CANCELLED); - return; - } - - syncer_.Connect(std::make_unique( - syncer_.GetIOContext(), remote_node_id_, [this](auto msg) { - syncer_.BroadcastMessage(msg); - })); - response->set_node_id(syncer_.GetLocalNodeID()); - reactor->Finish(grpc::Status::OK); - }, - "RaySyncer::StartSync"); - return reactor; -} - -grpc::ServerUnaryReactor *RaySyncerService::Update(grpc::CallbackServerContext *context, - const RaySyncMessages *request, - DummyResponse *) { - auto *reactor = context->DefaultReactor(); - // Make sure request is allocated from heap so that it can be moved safely. 
- RAY_CHECK(request->GetArena() == nullptr); - syncer_.GetIOContext().dispatch( - [this, request = std::move(*const_cast(request))]() mutable { - auto *sync_connection = dynamic_cast( - syncer_.GetSyncConnection(remote_node_id_)); - if (sync_connection != nullptr) { - sync_connection->ReceiveUpdate(std::move(request)); - } else { - RAY_LOG(FATAL) << "Fail to get the sync context"; - } - }, - "SyncerUpdate"); - reactor->Finish(grpc::Status::OK); - return reactor; -} - -grpc::ServerUnaryReactor *RaySyncerService::LongPolling( - grpc::CallbackServerContext *context, - const DummyRequest *, - RaySyncMessages *response) { - auto *reactor = context->DefaultReactor(); - syncer_.GetIOContext().dispatch( - [this, reactor, response]() mutable { - auto *sync_connection = dynamic_cast( - syncer_.GetSyncConnection(remote_node_id_)); - if (sync_connection != nullptr) { - sync_connection->HandleLongPollingRequest(reactor, response); - } else { - RAY_LOG(ERROR) << "Fail to setup long-polling"; - reactor->Finish(grpc::Status::CANCELLED); - } - }, - "SyncLongPolling"); +ServerBidiReactor *RaySyncerService::StartSync(grpc::CallbackServerContext *context) { + auto reactor = new RayServerBidiReactor( + context, + syncer_.GetIOContext(), + syncer_.GetLocalNodeID(), + [this](auto msg) mutable { syncer_.BroadcastMessage(msg); }, + [this](const std::string &node_id, bool reconnect) mutable { + // No need to reconnect for server side. + RAY_CHECK(!reconnect); + syncer_.sync_reactors_.erase(node_id); + }); + RAY_LOG(DEBUG) << "Get connection from " + << NodeID::FromBinary(reactor->GetRemoteNodeID()) << " to " + << NodeID::FromBinary(syncer_.GetLocalNodeID()); + syncer_.Connect(reactor); return reactor; } -RaySyncerService::~RaySyncerService() { syncer_.Disconnect(remote_node_id_); } +RaySyncerService::~RaySyncerService() {} } // namespace syncer } // namespace ray diff --git a/src/ray/common/ray_syncer/ray_syncer.h b/src/ray/common/ray_syncer/ray_syncer.h index 07c636b6cc29..abe835c60e0a 100644 --- a/src/ray/common/ray_syncer/ray_syncer.h +++ b/src/ray/common/ray_syncer/ray_syncer.h @@ -27,13 +27,11 @@ namespace ray { namespace syncer { -using ray::rpc::syncer::DummyRequest; -using ray::rpc::syncer::DummyResponse; using ray::rpc::syncer::MessageType; using ray::rpc::syncer::RaySyncMessage; -using ray::rpc::syncer::RaySyncMessages; -using ray::rpc::syncer::StartSyncRequest; -using ray::rpc::syncer::StartSyncResponse; + +using ServerBidiReactor = grpc::ServerBidiReactor; +using ClientBidiReactor = grpc::ClientBidiReactor; static constexpr size_t kComponentArraySize = static_cast(ray::rpc::syncer::MessageType_ARRAYSIZE); @@ -73,7 +71,7 @@ struct ReceiverInterface { // Forward declaration of internal structures class NodeState; -class NodeSyncConnection; +class RaySyncerBidiReactor; /// RaySyncer is an embedding service for component synchronization. /// All operations in this class needs to be finished GetIOContext() @@ -81,9 +79,9 @@ class NodeSyncConnection; /// RaySyncer is the control plane to make sure all connections eventually /// have the latest view of the cluster components registered. /// RaySyncer has two components: -/// 1. NodeSyncConnection: keeps track of the sending and receiving information +/// 1. RaySyncerBidiReactor: keeps track of the sending and receiving information /// and make sure not sending the information the remote node knows. -/// 2. NodeState: keeps track of the local status, similar to NodeSyncConnection, +/// 2. 
NodeState: keeps track of the local status, similar to RaySyncerBidiReactor, // but it's for local node. class RaySyncer { public: @@ -98,15 +96,9 @@ class RaySyncer { /// TODO (iycheng): Introduce grpc channel pool and use node_id /// for the connection. /// - /// \param connection The connection to the remote node. - void Connect(std::unique_ptr connection); - - /// Connect to a node. - /// TODO (iycheng): Introduce grpc channel pool and use node_id - /// for the connection. - /// - /// \param connection The connection to the remote node. - void Connect(std::shared_ptr channel); + /// \param node_id The id of the node connect to. + /// \param channel The gRPC channel. + void Connect(const std::string &node_id, std::shared_ptr channel); void Disconnect(const std::string &node_id); @@ -121,7 +113,7 @@ class RaySyncer { /// \param pull_from_reporter_interval_ms The frequence to pull a message. 0 means /// never pull a message in syncer. /// from reporter and push it to sending queue. - bool Register(MessageType message_type, + void Register(MessageType message_type, const ReporterInterface *reporter, ReceiverInterface *receiver, int64_t pull_from_reporter_interval_ms = 100); @@ -143,24 +135,16 @@ class RaySyncer { /// \param message The message to be broadcasted. void BroadcastRaySyncMessage(std::shared_ptr message); + std::vector GetAllConnectedNodeIDs() const; + private: + void Connect(RaySyncerBidiReactor *connection); + + std::shared_ptr stopped_; + /// Get the io_context used by RaySyncer. instrumented_io_context &GetIOContext() { return io_context_; } - /// Get the SyncConnection of a node. - /// - /// \param node_id The node id to lookup. - /// - /// \return nullptr if it doesn't exist, otherwise, the connection associated with the - /// node. - NodeSyncConnection *GetSyncConnection(const std::string &node_id) const { - auto iter = sync_connections_.find(node_id); - if (iter == sync_connections_.end()) { - return nullptr; - } - return iter->second.get(); - } - /// Function to broadcast the messages to other nodes. /// A message will be sent to a node if that node doesn't have this message. /// The message can be generated by local reporter or received by the other node. @@ -175,29 +159,14 @@ class RaySyncer { const std::string local_node_id_; /// Manage connections. Here the key is the NodeID in binary form. - absl::flat_hash_map> sync_connections_; - - /// Upward connections. These are connections initialized not by the local node. - absl::flat_hash_set upward_connections_; + absl::flat_hash_map sync_reactors_; /// The local node state std::unique_ptr node_state_; - /// Context of a rpc call. - struct StartSyncCall { - StartSyncRequest request; - StartSyncResponse response; - grpc::ClientContext context; - std::promise promise; - }; - - absl::flat_hash_set> inflight_requests_; - /// Timer is used to do broadcasting. ray::PeriodicalRunner timer_; - std::shared_ptr stopped_; - friend class RaySyncerService; /// Test purpose friend struct SyncerServerTest; @@ -209,9 +178,6 @@ class RaySyncer { FRIEND_TEST(SyncerTest, Reconnect); }; -class ClientSyncConnection; -class ServerSyncConnection; - /// RaySyncerService is a service to take care of resource synchronization /// related operations. /// Right now only raylet needs to setup this service. 
But in the future, @@ -223,25 +189,10 @@ class RaySyncerService : public ray::rpc::syncer::RaySyncer::CallbackService { ~RaySyncerService(); - grpc::ServerUnaryReactor *StartSync(grpc::CallbackServerContext *context, - const StartSyncRequest *request, - StartSyncResponse *response) override; - - grpc::ServerUnaryReactor *Update(grpc::CallbackServerContext *context, - const RaySyncMessages *request, - DummyResponse *) override; - - grpc::ServerUnaryReactor *LongPolling(grpc::CallbackServerContext *context, - const DummyRequest *, - RaySyncMessages *response) override; + grpc::ServerBidiReactor *StartSync( + grpc::CallbackServerContext *context) override; private: - // This will be created after connection is established. - // Ideally this should be owned by RaySyncer, but since we are doing - // long-polling right now, we have to put it here so that when - // long-polling request comes, we can set it up. - std::string remote_node_id_; - // The ray syncer this RPC wrappers of. RaySyncer &syncer_; }; diff --git a/src/ray/common/test/ray_syncer_test.cc b/src/ray/common/test/ray_syncer_test.cc index 8ca793737778..ff0652d22be3 100644 --- a/src/ray/common/test/ray_syncer_test.cc +++ b/src/ray/common/test/ray_syncer_test.cc @@ -27,6 +27,7 @@ #include #include "ray/common/ray_syncer/ray_syncer.h" +#include "ray/rpc/grpc_server.h" #include "mock/ray/common/ray_syncer/ray_syncer.h" // clang-format on @@ -44,6 +45,9 @@ namespace syncer { constexpr size_t kTestComponents = 1; +using work_guard_type = + boost::asio::executor_work_guard; + RaySyncMessage MakeMessage(MessageType cid, int64_t version, const NodeID &id) { auto msg = RaySyncMessage(); msg.set_version(version); @@ -55,6 +59,7 @@ RaySyncMessage MakeMessage(MessageType cid, int64_t version, const NodeID &id) { class RaySyncerTest : public ::testing::Test { protected: void SetUp() override { + work_guard_ = std::make_unique(io_context_.get_executor()); local_versions_.fill(0); for (size_t cid = 0; cid < reporters_.size(); ++cid) { receivers_[cid] = std::make_unique(); @@ -74,10 +79,7 @@ class RaySyncerTest : public ::testing::Test { ON_CALL(*reporter, CreateSyncMessage(_, _)) .WillByDefault(WithArg<0>(Invoke(take_snapshot))); } - thread_ = std::make_unique([this]() { - boost::asio::io_context::work work(io_context_); - io_context_.run(); - }); + thread_ = std::make_unique([this]() { io_context_.run(); }); local_id_ = NodeID::FromRandom(); syncer_ = std::make_unique(io_context_, local_id_.Binary()); } @@ -95,7 +97,7 @@ class RaySyncerTest : public ::testing::Test { } void TearDown() override { - io_context_.stop(); + work_guard_->reset(); thread_->join(); } @@ -106,6 +108,7 @@ class RaySyncerTest : public ::testing::Test { nullptr}; instrumented_io_context io_context_; + std::unique_ptr work_guard_; std::unique_ptr thread_; std::unique_ptr syncer_; @@ -145,40 +148,58 @@ TEST_F(RaySyncerTest, NodeStateConsume) { ASSERT_FALSE(node_status->ConsumeSyncMessage(std::make_shared(msg))); } -TEST_F(RaySyncerTest, NodeSyncConnection) { +struct MockReactor { + void StartRead(RaySyncMessage *) { ++read_cnt; } + + void StartWrite(const RaySyncMessage *, + grpc::WriteOptions opts = grpc::WriteOptions()) { + ++write_cnt; + } + + virtual void OnWriteDone(bool ok) {} + virtual void OnReadDone(bool ok) {} + + size_t read_cnt = 0; + size_t write_cnt = 0; +}; + +TEST_F(RaySyncerTest, RaySyncerBidiReactorBase) { auto node_id = NodeID::FromRandom(); - MockNodeSyncConnection sync_connection( + MockRaySyncerBidiReactorBase sync_reactor( io_context_, node_id.Binary(), - 
[](std::shared_ptr) {}); + [](std::shared_ptr) {}); auto from_node_id = NodeID::FromRandom(); auto msg = MakeMessage(MessageType::RESOURCE_VIEW, 0, from_node_id); + auto msg_ptr1 = std::make_shared(msg); + msg.set_version(2); + auto msg_ptr2 = std::make_shared(msg); + msg.set_version(3); + auto msg_ptr3 = std::make_shared(msg); // First push will succeed and the second one will be deduplicated. - ASSERT_TRUE(sync_connection.PushToSendingQueue(std::make_shared(msg))); - ASSERT_FALSE(sync_connection.PushToSendingQueue(std::make_shared(msg))); - ASSERT_EQ(1, sync_connection.sending_buffer_.size()); - ASSERT_EQ(0, sync_connection.sending_buffer_.begin()->second->version()); - ASSERT_EQ(1, sync_connection.node_versions_.size()); + ASSERT_TRUE(sync_reactor.PushToSendingQueue(msg_ptr1)); + ASSERT_FALSE(sync_reactor.PushToSendingQueue(msg_ptr1)); + ASSERT_EQ(0, sync_reactor.sending_buffer_.size()); + + ASSERT_TRUE(sync_reactor.PushToSendingQueue(msg_ptr2)); + ASSERT_EQ(1, sync_reactor.sending_buffer_.size()); + ASSERT_EQ(1, sync_reactor.node_versions_.size()); + ASSERT_EQ(2, sync_reactor.sending_buffer_.begin()->second->version()); ASSERT_EQ( - 0, - sync_connection.node_versions_[from_node_id.Binary()][MessageType::RESOURCE_VIEW]); + 2, sync_reactor.node_versions_[from_node_id.Binary()][MessageType::RESOURCE_VIEW]); - msg.set_version(2); - ASSERT_TRUE(sync_connection.PushToSendingQueue(std::make_shared(msg))); - ASSERT_FALSE(sync_connection.PushToSendingQueue(std::make_shared(msg))); - // The previous message is deleted. - ASSERT_EQ(1, sync_connection.sending_buffer_.size()); - ASSERT_EQ(1, sync_connection.node_versions_.size()); - ASSERT_EQ(2, sync_connection.sending_buffer_.begin()->second->version()); + ASSERT_TRUE(sync_reactor.PushToSendingQueue(msg_ptr3)); + ASSERT_EQ(1, sync_reactor.sending_buffer_.size()); + ASSERT_EQ(1, sync_reactor.node_versions_.size()); + ASSERT_EQ(3, sync_reactor.sending_buffer_.begin()->second->version()); ASSERT_EQ( - 2, - sync_connection.node_versions_[from_node_id.Binary()][MessageType::RESOURCE_VIEW]); + 3, sync_reactor.node_versions_[from_node_id.Binary()][MessageType::RESOURCE_VIEW]); } struct SyncerServerTest { - SyncerServerTest(std::string port) { + SyncerServerTest(std::string port) : work_guard(io_context.get_executor()) { this->server_port = port; // Setup io context auto node_id = NodeID::FromRandom(); @@ -187,6 +208,7 @@ struct SyncerServerTest { } // Setup syncer and grpc server syncer = std::make_unique(io_context, node_id.Binary()); + thread = std::make_unique([this] { io_context.run(); }); auto server_address = std::string("0.0.0.0:") + port; grpc::ServerBuilder builder; @@ -196,7 +218,10 @@ struct SyncerServerTest { server = builder.BuildAndStart(); for (size_t cid = 0; cid < reporters.size(); ++cid) { - auto snapshot_received = [this](std::shared_ptr message) { + auto snapshot_received = [this, + node_id](std::shared_ptr message) { + RAY_LOG(DEBUG) << "Message received: from " + << NodeID::FromBinary(message->node_id()) << " to " << node_id; auto iter = received_versions.find(message->node_id()); if (iter == received_versions.end()) { for (auto &v : received_versions[message->node_id()]) { @@ -208,6 +233,9 @@ struct SyncerServerTest { received_versions[message->node_id()][message->message_type()] = message->version(); message_consumed[message->node_id()]++; + RAY_LOG(DEBUG) << "Message consumed from " + << NodeID::FromBinary(message->node_id()) + << ", local_id=" << node_id; }; receivers[cid] = std::make_unique(); EXPECT_CALL(*receivers[cid], 
ConsumeSyncMessage(_)) @@ -232,10 +260,6 @@ struct SyncerServerTest { syncer->Register( static_cast(cid), reporter.get(), receivers[cid].get()); } - thread = std::make_unique([this] { - boost::asio::io_context::work work(io_context); - io_context.run(); - }); } void WaitSendingFlush() { @@ -244,13 +268,22 @@ struct SyncerServerTest { auto f = p.get_future(); io_context.post( [&p, this]() mutable { - for (const auto &[node_id, conn] : syncer->sync_connections_) { - if (!conn->sending_buffer_.empty()) { + for (const auto &[node_id, conn] : syncer->sync_reactors_) { + auto ptr = dynamic_cast(conn); + size_t remainings = 0; + if (ptr == nullptr) { + remainings = + dynamic_cast(conn)->sending_buffer_.size(); + } else { + remainings = ptr->sending_buffer_.size(); + } + + if (remainings != 0) { p.set_value(false); RAY_LOG(INFO) << NodeID::FromBinary(syncer->GetLocalNodeID()) << ": " << "Waiting for message on " << NodeID::FromBinary(node_id) << " to be sent." - << " Remainings " << conn->sending_buffer_.size(); + << " Remainings " << remainings; return; } } @@ -281,11 +314,19 @@ struct SyncerServerTest { return false; } - ~SyncerServerTest() { - service.reset(); - server.reset(); + void Stop() { + for (auto node_id : syncer->GetAllConnectedNodeIDs()) { + syncer->Disconnect(node_id); + } + + server->Shutdown(); + io_context.stop(); thread->join(); + + server.reset(); + service.reset(); + syncer.reset(); } @@ -314,7 +355,9 @@ struct SyncerServerTest { std::unique_ptr syncer; std::unique_ptr server; std::unique_ptr thread; + instrumented_io_context io_context; + work_guard_type work_guard; std::string server_port; std::array, kTestComponents> local_versions; std::array, kTestComponents> reporters = { @@ -367,38 +410,57 @@ using TClusterView = absl::flat_hash_map< std::string, std::array, kComponentArraySize>>; -TEST(SyncerTest, Test1To1) { - auto s1 = SyncerServerTest("19990"); +class SyncerTest : public ::testing::Test { + public: + SyncerServerTest &MakeServer(std::string port) { + servers.emplace_back(std::make_unique(port)); + return *servers.back(); + } + + protected: + void TearDown() override { + // Drain all grpc requests. 
+ for (auto &s : servers) { + s->Stop(); + } + + std::this_thread::sleep_for(1s); + } + std::vector> servers; +}; + +TEST_F(SyncerTest, Test1To1) { + auto &s1 = MakeServer("19990"); - auto s2 = SyncerServerTest("19991"); + auto &s2 = MakeServer("19991"); // Make sure the setup is correct ASSERT_NE(nullptr, s1.receivers[MessageType::RESOURCE_VIEW]); ASSERT_NE(nullptr, s2.receivers[MessageType::RESOURCE_VIEW]); ASSERT_NE(nullptr, s1.reporters[MessageType::RESOURCE_VIEW]); ASSERT_NE(nullptr, s2.reporters[MessageType::RESOURCE_VIEW]); + RAY_LOG(DEBUG) << "s1: " << NodeID::FromBinary(s1.syncer->GetLocalNodeID()); + RAY_LOG(DEBUG) << "s2: " << NodeID::FromBinary(s2.syncer->GetLocalNodeID()); auto channel_to_s2 = MakeChannel("19991"); - s1.syncer->Connect(channel_to_s2); + s1.syncer->Connect(s2.syncer->GetLocalNodeID(), channel_to_s2); // Make sure s2 adds s1 ASSERT_TRUE(s2.WaitUntil( - [&s2]() { - return s2.syncer->sync_connections_.size() == 1 && s2.snapshot_taken == 1; - }, + [&s2]() { return s2.syncer->sync_reactors_.size() == 1 && s2.snapshot_taken == 1; }, 5)); // Make sure s1 adds s2 ASSERT_TRUE(s1.WaitUntil( - [&s1]() { - return s1.syncer->sync_connections_.size() == 1 && s1.snapshot_taken == 1; - }, + [&s1]() { return s1.syncer->sync_reactors_.size() == 1 && s1.snapshot_taken == 1; }, 5)); // s1 will only send 1 message to s2 because it only has one reporter ASSERT_TRUE(s2.WaitUntil( [&s2, node_id = s1.syncer->GetLocalNodeID()]() { + RAY_LOG(DEBUG) << NodeID::FromBinary(node_id) << " - " + << s2.GetNumConsumedMessages(node_id); return s2.GetNumConsumedMessages(node_id) == 1; }, 5)); @@ -406,6 +468,9 @@ TEST(SyncerTest, Test1To1) { // s2 will send 2 messages to s1 because it has two reporters. ASSERT_TRUE(s1.WaitUntil( [&s1, node_id = s2.syncer->GetLocalNodeID()]() { + RAY_LOG(DEBUG) << "Num of messages from " << NodeID::FromBinary(node_id) << " to " + << NodeID::FromBinary(s1.syncer->GetLocalNodeID()) << " is " + << s1.GetNumConsumedMessages(node_id); return s1.GetNumConsumedMessages(node_id) == 1; }, 5)); @@ -475,7 +540,7 @@ TEST(SyncerTest, Test1To1) { ASSERT_LE(s2.GetNumConsumedMessages(s1.syncer->GetLocalNodeID()), max_sends + 3); } -TEST(SyncerTest, Reconnect) { +TEST_F(SyncerTest, Reconnect) { // This test is to check reconnect works. 
// Firstly // s1 -> s3 @@ -483,59 +548,47 @@ TEST(SyncerTest, Reconnect) { // s2 -> s3 // And we need to ensure s3 is connecting to s2 - auto s1 = SyncerServerTest("19990"); - auto s2 = SyncerServerTest("19991"); - auto s3 = SyncerServerTest("19992"); + auto &s1 = MakeServer("19990"); + auto &s2 = MakeServer("19991"); + auto &s3 = MakeServer("19992"); - s1.syncer->Connect(MakeChannel("19992")); + s1.syncer->Connect(s3.syncer->GetLocalNodeID(), MakeChannel("19992")); // Make sure the setup is correct ASSERT_TRUE(s1.WaitUntil( - [&s1]() { - return s1.syncer->sync_connections_.size() == 1 && s1.snapshot_taken == 1; - }, + [&s1]() { return s1.syncer->sync_reactors_.size() == 1 && s1.snapshot_taken == 1; }, 5)); ASSERT_TRUE(s1.WaitUntil( - [&s3]() { - return s3.syncer->sync_connections_.size() == 1 && s3.snapshot_taken == 1; - }, + [&s3]() { return s3.syncer->sync_reactors_.size() == 1 && s3.snapshot_taken == 1; }, 5)); - s2.syncer->Connect(MakeChannel("19992")); + s2.syncer->Connect(s3.syncer->GetLocalNodeID(), MakeChannel("19992")); ASSERT_TRUE(s1.WaitUntil( - [&s2]() { - return s2.syncer->sync_connections_.size() == 1 && s2.snapshot_taken == 1; - }, + [&s2]() { return s2.syncer->sync_reactors_.size() == 1 && s2.snapshot_taken == 1; }, 5)); } -TEST(SyncerTest, Broadcast) { +TEST_F(SyncerTest, Broadcast) { // This test covers the broadcast feature of ray syncer. - auto s1 = SyncerServerTest("19990"); - auto s2 = SyncerServerTest("19991"); - auto s3 = SyncerServerTest("19992"); + auto &s1 = MakeServer("19990"); + auto &s2 = MakeServer("19991"); + auto &s3 = MakeServer("19992"); // We need to make sure s1 is sending data to s3 for s2 - s1.syncer->Connect(MakeChannel("19991")); - s1.syncer->Connect(MakeChannel("19992")); + s1.syncer->Connect(s2.syncer->GetLocalNodeID(), MakeChannel("19991")); + s1.syncer->Connect(s3.syncer->GetLocalNodeID(), MakeChannel("19992")); // Make sure the setup is correct ASSERT_TRUE(s1.WaitUntil( - [&s1]() { - return s1.syncer->sync_connections_.size() == 2 && s1.snapshot_taken == 1; - }, + [&s1]() { return s1.syncer->sync_reactors_.size() == 2 && s1.snapshot_taken == 1; }, 5)); ASSERT_TRUE(s1.WaitUntil( - [&s2]() { - return s2.syncer->sync_connections_.size() == 1 && s2.snapshot_taken == 1; - }, + [&s2]() { return s2.syncer->sync_reactors_.size() == 1 && s2.snapshot_taken == 1; }, 5)); ASSERT_TRUE(s1.WaitUntil( - [&s3]() { - return s3.syncer->sync_connections_.size() == 1 && s3.snapshot_taken == 1; - }, + [&s3]() { return s3.syncer->sync_reactors_.size() == 1 && s3.snapshot_taken == 1; }, 5)); // Change the resource in s2 and make sure s1 && s3 are correct @@ -554,7 +607,7 @@ TEST(SyncerTest, Broadcast) { 5)); } -bool CompareViews(const std::vector> &servers, +bool CompareViews(const std::vector &servers, const std::vector &views, const std::vector> &g) { // Check broadcasting is working @@ -595,7 +648,7 @@ bool CompareViews(const std::vector> &servers, } bool TestCorrectness(std::function get_cluster_view, - std::vector> &servers, + std::vector &servers, const std::vector> &g) { auto check = [&servers, get_cluster_view, &g]() { std::vector views; @@ -656,15 +709,16 @@ bool TestCorrectness(std::function get_cluster_ return check(); } -TEST(SyncerTest, Test1ToN) { +TEST_F(SyncerTest, Test1ToN) { size_t base_port = 18990; - std::vector> servers; + std::vector servers; for (int i = 0; i < 20; ++i) { - servers.push_back(std::make_unique(std::to_string(i + base_port))); + servers.push_back(&MakeServer(std::to_string(i + base_port))); } std::vector> g(servers.size()); for 
(size_t i = 1; i < servers.size(); ++i) { - servers[0]->syncer->Connect(MakeChannel(servers[i]->server_port)); + servers[0]->syncer->Connect(servers[i]->syncer->GetLocalNodeID(), + MakeChannel(servers[i]->server_port)); g[0].insert(i); } @@ -680,11 +734,11 @@ TEST(SyncerTest, Test1ToN) { ASSERT_TRUE(TestCorrectness(get_cluster_view, servers, g)); } -TEST(SyncerTest, TestMToN) { +TEST_F(SyncerTest, TestMToN) { size_t base_port = 18990; - std::vector> servers; + std::vector servers; for (int i = 0; i < 20; ++i) { - servers.push_back(std::make_unique(std::to_string(i + base_port))); + servers.push_back(&MakeServer(std::to_string(i + base_port))); } std::vector> g(servers.size()); // Try to construct a tree based structure @@ -693,7 +747,8 @@ TEST(SyncerTest, TestMToN) { while (i < servers.size()) { // try to connect to 2 servers per node. for (int k = 0; k < 2 && i < servers.size(); ++k, ++i) { - servers[curr]->syncer->Connect(MakeChannel(servers[i]->server_port)); + servers[curr]->syncer->Connect(servers[i]->syncer->GetLocalNodeID(), + MakeChannel(servers[i]->server_port)); g[curr].insert(i); } ++curr; @@ -710,5 +765,166 @@ TEST(SyncerTest, TestMToN) { ASSERT_TRUE(TestCorrectness(get_cluster_view, servers, g)); } +struct MockRaySyncerService : public ray::rpc::syncer::RaySyncer::CallbackService { + MockRaySyncerService( + instrumented_io_context &_io_context, + std::function)> _message_processor, + std::function _cleanup_cb) + : message_processor(_message_processor), + cleanup_cb(_cleanup_cb), + node_id(NodeID::FromRandom()), + io_context(_io_context) {} + grpc::ServerBidiReactor *StartSync( + grpc::CallbackServerContext *context) override { + reactor = new RayServerBidiReactor( + context, io_context, node_id.Binary(), message_processor, cleanup_cb); + return reactor; + } + + std::function)> message_processor; + std::function cleanup_cb; + NodeID node_id; + instrumented_io_context &io_context; + RayServerBidiReactor *reactor = nullptr; +}; + +class SyncerReactorTest : public ::testing::Test { + protected: + void SetUp() override { + rpc_service_ = std::make_unique( + io_context_, + [this](auto msg) { server_received_message.set_value(msg); }, + [this](auto &node, bool restart) { + server_cleanup.set_value(std::make_pair(node, restart)); + }); + grpc::ServerBuilder builder; + builder.AddListeningPort("0.0.0.0:18990", grpc::InsecureServerCredentials()); + builder.RegisterService(rpc_service_.get()); + server = builder.BuildAndStart(); + + client_node_id = NodeID::FromRandom(); + cli_channel = MakeChannel("18990"); + auto cli_stub = ray::rpc::syncer::RaySyncer::NewStub(cli_channel); + cli_reactor = std::make_unique( + rpc_service_->node_id.Binary(), + client_node_id.Binary(), + io_context_, + [this](auto msg) { client_received_message.set_value(msg); }, + [this](const std::string &n, bool r) { + client_cleanup.set_value(std::make_pair(n, r)); + }, + std::move(cli_stub)) + .release(); + cli_reactor->StartCall(); + + work_guard_ = std::make_unique(io_context_.get_executor()); + thread_ = std::make_unique([this]() { io_context_.run(); }); + + auto start = steady_clock::now(); + while (duration_cast(steady_clock::now() - start).count() <= 5) { + RAY_LOG(INFO) << "Waiting: " + << duration_cast(steady_clock::now() - start).count(); + if (rpc_service_->reactor != nullptr) { + break; + }; + std::this_thread::sleep_for(1s); + } + } + + void TearDown() override { + io_context_.stop(); + thread_->join(); + } + + std::pair GetReactors() { + return std::make_pair(rpc_service_->reactor, cli_reactor); + } + + 
std::pair GetNodeID() { + return std::make_pair(rpc_service_->node_id.Binary(), client_node_id.Binary()); + } + + void ResetPromise() { + server_received_message = std::promise>(); + client_received_message = std::promise>(); + server_cleanup = std::promise>(); + client_cleanup = std::promise>(); + } + + instrumented_io_context io_context_; + std::unique_ptr work_guard_; + std::unique_ptr thread_; + std::unique_ptr rpc_service_; + std::unique_ptr server; + std::promise> server_received_message; + std::promise> client_received_message; + std::promise> server_cleanup; + std::promise> client_cleanup; + + grpc::ClientContext cli_context; + RayClientBidiReactor *cli_reactor; + std::shared_ptr cli_channel; + NodeID client_node_id; +}; + +TEST_F(SyncerReactorTest, TestReactor) { + auto [s, c] = GetReactors(); + auto [node_s, node_c] = GetNodeID(); + ASSERT_TRUE(s != nullptr); + ASSERT_TRUE(c != nullptr); + + auto msg_s = std::make_shared(); + msg_s->set_version(1); + msg_s->set_node_id(node_s); + + s->PushToSendingQueue(msg_s); + + auto msg_c = std::make_shared(); + msg_c->set_version(2); + msg_c->set_node_id(node_c); + + c->PushToSendingQueue(msg_c); + // Make sure sending is working + auto server_received = server_received_message.get_future().get(); + auto client_received = client_received_message.get_future().get(); + ResetPromise(); + ASSERT_EQ(server_received->version(), 2); + ASSERT_EQ(server_received->node_id(), node_c); + ASSERT_EQ(client_received->version(), 1); + ASSERT_EQ(client_received->node_id(), node_s); + + s->Disconnect(); + auto c_cleanup = client_cleanup.get_future().get(); + ASSERT_EQ(node_s, c_cleanup.first); + ASSERT_EQ(false, c_cleanup.second); +} + +TEST_F(SyncerReactorTest, TestReactorFailure) { + auto [s, c] = GetReactors(); + auto [node_s, node_c] = GetNodeID(); + ASSERT_TRUE(s != nullptr); + ASSERT_TRUE(c != nullptr); + s->Finish(grpc::Status::CANCELLED); + auto c_cleanup = client_cleanup.get_future().get(); + ASSERT_EQ(node_s, c_cleanup.first); + ASSERT_EQ(true, c_cleanup.second); +} + } // namespace syncer } // namespace ray + +int main(int argc, char **argv) { + InitShutdownRAII ray_log_shutdown_raii(ray::RayLog::StartRayLog, + ray::RayLog::ShutDownRayLog, + argv[0], + ray::RayLogLevel::INFO, + /*log_dir=*/""); + ray::RayLog::InstallFailureSignalHandler(argv[0]); + ray::RayLog::InstallTerminateHandler(); + + ::testing::InitGoogleTest(&argc, argv); + auto ret = RUN_ALL_TESTS(); + // Sleep for gRPC to gracefully shutdown. 
+ std::this_thread::sleep_for(2s); + return ret; +} diff --git a/src/ray/common/test/syncer_service_e2e_test.cc b/src/ray/common/test/syncer_service_e2e_test.cc index f8e3999439b7..0e8c37d249c3 100644 --- a/src/ray/common/test/syncer_service_e2e_test.cc +++ b/src/ray/common/test/syncer_service_e2e_test.cc @@ -123,7 +123,7 @@ int main(int argc, char *argv[]) { channel = grpc::CreateCustomChannel( "localhost:" + leader_port, grpc::InsecureChannelCredentials(), argument); - syncer.Connect(channel); + syncer.Connect(ray::NodeID::FromRandom().Binary(), channel); } boost::asio::io_context::work work(io_context); diff --git a/src/ray/gcs/gcs_server/gcs_actor_scheduler.cc b/src/ray/gcs/gcs_server/gcs_actor_scheduler.cc index 0d08b337e8d5..7fa71a8791cf 100644 --- a/src/ray/gcs/gcs_server/gcs_actor_scheduler.cc +++ b/src/ray/gcs/gcs_server/gcs_actor_scheduler.cc @@ -444,7 +444,6 @@ void GcsActorScheduler::CreateActorOnWorker(std::shared_ptr actor, RAY_LOG(INFO) << "Start creating actor " << actor->GetActorID() << " on worker " << worker->GetWorkerID() << " at node " << actor->GetNodeID() << ", job id = " << actor->GetActorID().JobId(); - std::unique_ptr request(new rpc::PushTaskRequest()); request->set_intended_worker_id(worker->GetWorkerID().Binary()); request->mutable_task_spec()->CopyFrom( diff --git a/src/ray/gcs/gcs_server/gcs_server.cc b/src/ray/gcs/gcs_server/gcs_server.cc index 706a483c3760..5d9f98db3b83 100644 --- a/src/ray/gcs/gcs_server/gcs_server.cc +++ b/src/ray/gcs/gcs_server/gcs_server.cc @@ -50,7 +50,6 @@ GcsServer::GcsServer(const ray::gcs::GcsServerConfig &config, RayConfig::instance().gcs_server_rpc_client_thread_num()), raylet_client_pool_( std::make_shared(client_call_manager_)), - local_node_id_(NodeID::FromRandom()), pubsub_periodical_runner_(pubsub_io_service_), periodical_runner_(main_service), is_started_(false), @@ -273,7 +272,7 @@ void GcsServer::InitGcsResourceManager(const GcsInitData &gcs_init_data) { gcs_resource_manager_ = std::make_shared( main_service_, cluster_resource_scheduler_->GetClusterResourceManager(), - local_node_id_, + kGCSNodeID, cluster_task_manager_); // Initialize by gcs tables data. 
@@ -320,7 +319,7 @@ void GcsServer::InitGcsResourceManager(const GcsInitData &gcs_init_data) { void GcsServer::InitClusterResourceScheduler() { cluster_resource_scheduler_ = std::make_shared( - scheduling::NodeID(local_node_id_.Binary()), + scheduling::NodeID(kGCSNodeID.Binary()), NodeResources(), /*is_node_available_fn=*/ [](auto) { return true; }, @@ -330,7 +329,7 @@ void GcsServer::InitClusterResourceScheduler() { void GcsServer::InitClusterTaskManager() { RAY_CHECK(cluster_resource_scheduler_); cluster_task_manager_ = std::make_shared( - local_node_id_, + kGCSNodeID, cluster_resource_scheduler_, /*get_node_info=*/ [this](const NodeID &node_id) { @@ -472,8 +471,8 @@ std::string GcsServer::StorageType() const { void GcsServer::InitRaySyncer(const GcsInitData &gcs_init_data) { if (RayConfig::instance().use_ray_syncer()) { - ray_syncer_ = std::make_unique(ray_syncer_io_context_, - local_node_id_.Binary()); + ray_syncer_ = + std::make_unique(ray_syncer_io_context_, kGCSNodeID.Binary()); ray_syncer_->Register( syncer::MessageType::RESOURCE_VIEW, nullptr, gcs_resource_manager_.get()); ray_syncer_->Register( @@ -482,19 +481,8 @@ void GcsServer::InitRaySyncer(const GcsInitData &gcs_init_data) { boost::asio::io_service::work work(ray_syncer_io_context_); ray_syncer_io_context_.run(); }); - - for (const auto &pair : gcs_init_data.Nodes()) { - if (pair.second.state() == - rpc::GcsNodeInfo_GcsNodeState::GcsNodeInfo_GcsNodeState_ALIVE) { - rpc::Address address; - address.set_raylet_id(pair.second.node_id()); - address.set_ip_address(pair.second.node_manager_address()); - address.set_port(pair.second.node_manager_port()); - - auto raylet_client = raylet_client_pool_->GetOrConnectByAddress(address); - ray_syncer_->Connect(raylet_client->GetChannel()); - } - } + ray_syncer_service_ = std::make_unique(*ray_syncer_); + rpc_server_.RegisterService(*ray_syncer_service_); } else { /* The current synchronization flow is: @@ -622,9 +610,7 @@ void GcsServer::InstallEventListeners() { } cluster_task_manager_->ScheduleAndDispatchTasks(); - if (RayConfig::instance().use_ray_syncer()) { - ray_syncer_->Connect(raylet_client->GetChannel()); - } else { + if (!RayConfig::instance().use_ray_syncer()) { gcs_ray_syncer_->AddNode(*node); } }); @@ -640,9 +626,7 @@ void GcsServer::InstallEventListeners() { raylet_client_pool_->Disconnect(node_id); gcs_healthcheck_manager_->RemoveNode(node_id); - if (RayConfig::instance().use_ray_syncer()) { - ray_syncer_->Disconnect(node_id.Binary()); - } else { + if (!RayConfig::instance().use_ray_syncer()) { gcs_ray_syncer_->RemoveNode(*node); } }); @@ -776,14 +760,14 @@ void GcsServer::TryGlobalGC() { if (RayConfig::instance().use_ray_syncer()) { auto msg = std::make_shared(); msg->set_version(absl::GetCurrentTimeNanos()); - msg->set_node_id(local_node_id_.Binary()); + msg->set_node_id(kGCSNodeID.Binary()); msg->set_message_type(syncer::MessageType::COMMANDS); std::string serialized_msg; RAY_CHECK(resources_data.SerializeToString(&serialized_msg)); msg->set_sync_message(std::move(serialized_msg)); ray_syncer_->BroadcastRaySyncMessage(std::move(msg)); } else { - resources_data.set_node_id(local_node_id_.Binary()); + resources_data.set_node_id(kGCSNodeID.Binary()); gcs_ray_syncer_->Update(resources_data); } diff --git a/src/ray/gcs/gcs_server/gcs_server.h b/src/ray/gcs/gcs_server/gcs_server.h index f326d954bfea..f6397452aceb 100644 --- a/src/ray/gcs/gcs_server/gcs_server.h +++ b/src/ray/gcs/gcs_server/gcs_server.h @@ -188,9 +188,6 @@ class GcsServer { std::shared_ptr raylet_client_pool_; 
/// The gcs resource manager. std::shared_ptr gcs_resource_manager_; - /// The gcs server's node id, for the creation of `cluster_resource_scheduler_` and - /// `cluster_task_manager_`. - NodeID local_node_id_; /// The cluster resource scheduler. std::shared_ptr cluster_resource_scheduler_; /// The cluster task manager. @@ -226,6 +223,7 @@ class GcsServer { /// Ray Syncer realted fields. std::unique_ptr ray_syncer_; + std::unique_ptr ray_syncer_service_; std::unique_ptr ray_syncer_thread_; instrumented_io_context ray_syncer_io_context_; diff --git a/src/ray/protobuf/ray_syncer.proto b/src/ray/protobuf/ray_syncer.proto index f171665ef6f0..b24a0ecb323b 100644 --- a/src/ray/protobuf/ray_syncer.proto +++ b/src/ray/protobuf/ray_syncer.proto @@ -32,37 +32,6 @@ message RaySyncMessage { bytes node_id = 4; } -message RaySyncMessages { - // The bached messages. - repeated RaySyncMessage sync_messages = 1; -} - -message StartSyncRequest { - bytes node_id = 1; -} - -message StartSyncResponse { - bytes node_id = 1; -} - -message DummyRequest {} -message DummyResponse {} - service RaySyncer { - // Ideally these should be a streaming API like this - // rpc StartSync(stream RaySyncMessages) returns (stream RaySyncMessages); - // But to make sure it's the same as the current protocol, we still use - // unary rpc. - // TODO (iycheng): Using grpc streaming for the protocol. - - // This is the first message that should be sent. It will initialize - // some structure between nodes. - rpc StartSync(StartSyncRequest) returns (StartSyncResponse); - - // These two RPCs are for messages reporting and broadcasting. - // Update is used by the client to send update request to the server. - rpc Update(RaySyncMessages) returns (DummyResponse); - - // LongPolling is used by the server to send request to the client. - rpc LongPolling(DummyRequest) returns (RaySyncMessages); + rpc StartSync(stream RaySyncMessage) returns (stream RaySyncMessage); } diff --git a/src/ray/raylet/node_manager.cc b/src/ray/raylet/node_manager.cc index ad019b5dc233..31f722e8bf6a 100644 --- a/src/ray/raylet/node_manager.cc +++ b/src/ray/raylet/node_manager.cc @@ -527,6 +527,8 @@ ray::Status NodeManager::RegisterGcs() { /* receiver */ this, /* pull_from_reporter_interval_ms */ 0); + auto gcs_channel = gcs_client_->GetGcsRpcClient().GetChannel(); + ray_syncer_.Connect(kGCSNodeID.Binary(), gcs_channel); periodical_runner_.RunFnPeriodically( [this] { auto triggered_by_global_gc = TryLocalGC(); diff --git a/src/ray/rpc/grpc_client.h b/src/ray/rpc/grpc_client.h index e5c5065030aa..8c67353e2cb1 100644 --- a/src/ray/rpc/grpc_client.h +++ b/src/ray/rpc/grpc_client.h @@ -57,7 +57,8 @@ inline std::shared_ptr BuildChannel( ::RayConfig::instance().grpc_enable_http_proxy() ? 
1 : 0); arguments->SetMaxSendMessageSize(::RayConfig::instance().max_grpc_message_size()); arguments->SetMaxReceiveMessageSize(::RayConfig::instance().max_grpc_message_size()); - + arguments->SetInt(GRPC_ARG_HTTP2_WRITE_BUFFER_SIZE, + ::RayConfig::instance().grpc_stream_buffer_size()); std::shared_ptr channel; if (::RayConfig::instance().USE_TLS()) { std::string server_cert_file = std::string(::RayConfig::instance().TLS_SERVER_CERT()); diff --git a/src/ray/rpc/grpc_server.cc b/src/ray/rpc/grpc_server.cc index 962017aca9f7..d38e02d57151 100644 --- a/src/ray/rpc/grpc_server.cc +++ b/src/ray/rpc/grpc_server.cc @@ -83,7 +83,8 @@ void GrpcServer::Run() { builder.AddChannelArgument(GRPC_ARG_KEEPALIVE_TIMEOUT_MS, RayConfig::instance().grpc_keepalive_timeout_ms()); builder.AddChannelArgument(GRPC_ARG_KEEPALIVE_PERMIT_WITHOUT_CALLS, 0); - + builder.AddChannelArgument(GRPC_ARG_HTTP2_WRITE_BUFFER_SIZE, + RayConfig::instance().grpc_stream_buffer_size()); // NOTE(rickyyx): This argument changes how frequent the gRPC server expects a keepalive // ping from the client. See https://github.com/grpc/grpc/blob/HEAD/doc/keepalive.md#faq // We set this to 1min because GCS gRPC client currently sends keepalive every 1min: From 38ee064fa87fe9f2e6fa9889c49aa6de3914a001 Mon Sep 17 00:00:00 2001 From: shrekris-anyscale <92341594+shrekris-anyscale@users.noreply.github.com> Date: Thu, 26 Jan 2023 07:38:27 -0800 Subject: [PATCH 003/267] [Serve] Avoid killing replicas that are actively being deployed in `long_running_serve_failure` test (#31945) The `long_running_serve_failure` release test is unstable and passes about 50% of the time. It seems to fail after a `.deploy()` call errors with the message: ``` Traceback (most recent call last): File "workloads/serve_failure.py", line 159, in tester.run() File "workloads/serve_failure.py", line 130, in run action_chosen() File "workloads/serve_failure.py", line 107, in create_deployment handler.deploy() File "/home/ray/anaconda3/lib/python3.7/site-packages/ray/serve/deployment.py", line 217, in deploy self._deploy(*init_args, _blocking=_blocking, **init_kwargs) File "/home/ray/anaconda3/lib/python3.7/site-packages/ray/serve/deployment.py", line 244, in _deploy _blocking=_blocking, File "/home/ray/anaconda3/lib/python3.7/site-packages/ray/serve/_private/client.py", line 37, in check return f(self, *args, **kwargs) File "/home/ray/anaconda3/lib/python3.7/site-packages/ray/serve/_private/client.py", line 238, in deploy self._wait_for_deployment_healthy(name) File "/home/ray/anaconda3/lib/python3.7/site-packages/ray/serve/_private/client.py", line 174, in _wait_for_deployment_healthy f"Deployment {name} is UNHEALTHY: " f"{status.message}" RuntimeError: Deployment InWRYtjoUK is UNHEALTHY: ``` The deployment that's marked `UNHEALTHY` is always killed by the `RandomKiller` before this message appears. The issue is likely that: 1. The `RandomKiller` kills the deployment while it's still deploying 2. This causes the deployment to be [marked `UNHEALTHY`](https://github.com/ray-project/ray/blob/455100b54f0a82ce44dfa2257d40297c275424e0/python/ray/serve/_private/deployment_state.py#L1517-L1523) 3. This in turn causes [the `deploy()` call](https://github.com/ray-project/ray/blob/3735ba410ddfa63cc8516f69fa8b3997259a3f11/release/long_running_tests/workloads/serve_failure.py#L107) (and the test) [to raise an error and fail](https://github.com/ray-project/ray/blob/455100b54f0a82ce44dfa2257d40297c275424e0/python/ray/serve/_private/client.py#L172-L175). 
This change guards against this by preventing the `RandomKiller` from killing the deployment while it's deploying. --- python/ray/serve/_private/deployment_state.py | 6 ++- python/ray/serve/controller.py | 6 ++- .../workloads/serve_failure.py | 49 +++++++++++++------ 3 files changed, 43 insertions(+), 18 deletions(-) diff --git a/python/ray/serve/_private/deployment_state.py b/python/ray/serve/_private/deployment_state.py index 45b865241395..ba7cae52964c 100644 --- a/python/ray/serve/_private/deployment_state.py +++ b/python/ray/serve/_private/deployment_state.py @@ -1519,7 +1519,11 @@ def _check_and_update_replicas(self) -> bool: # recovered or a new deploy happens. if replica.version == self._target_state.version: self._curr_status_info: DeploymentStatusInfo = DeploymentStatusInfo( - self._name, DeploymentStatus.UNHEALTHY + name=self._name, + status=DeploymentStatus.UNHEALTHY, + message="A replica's health check failed. This " + "deployment will be UNHEALTHY until the replica " + "recovers or a new deploy happens.", ) slow_start_replicas = [] diff --git a/python/ray/serve/controller.py b/python/ray/serve/controller.py index 9dd231c84166..a05a47429e2c 100644 --- a/python/ray/serve/controller.py +++ b/python/ray/serve/controller.py @@ -312,7 +312,11 @@ def _recover_config_from_checkpoint(self): self.deploy_app(ServeApplicationSchema.parse_obj(config), update_time=False) def _all_running_replicas(self) -> Dict[str, List[RunningReplicaInfo]]: - """Used for testing.""" + """Used for testing. + + Returned dictionary maps deployment names to replica infos. + """ + return self.deployment_state_manager.get_running_replica_infos() def get_http_config(self): diff --git a/release/long_running_tests/workloads/serve_failure.py b/release/long_running_tests/workloads/serve_failure.py index fa94bfeef31c..319551b7c94f 100644 --- a/release/long_running_tests/workloads/serve_failure.py +++ b/release/long_running_tests/workloads/serve_failure.py @@ -2,11 +2,13 @@ import random import string import time +import asyncio import requests import ray from ray import serve +from ray.serve.context import get_global_client from ray.cluster_utils import Cluster from ray._private.test_utils import safe_write_to_results_json @@ -62,25 +64,35 @@ def update_progress(result): class RandomKiller: def __init__(self, kill_period_s=1): self.kill_period_s = kill_period_s + self.sanctuary = set() - def _get_all_serve_actors(self): - controller = serve.context.get_global_client()._controller + async def run(self): + while True: + chosen = random.choice(self._get_serve_actors()) + print(f"Killing {chosen}") + ray.kill(chosen, no_restart=False) + await asyncio.sleep(self.kill_period_s) + + async def spare(self, deployment_name: str): + print(f'Sparing deployment "{deployment_name}" replicas.') + self.sanctuary.add(deployment_name) + + async def stop_spare(self, deployment_name: str): + print(f'No longer sparing deployment "{deployment_name}" replicas.') + self.sanctuary.discard(deployment_name) + + def _get_serve_actors(self): + controller = get_global_client()._controller routers = list(ray.get(controller.get_http_proxies.remote()).values()) all_handles = routers + [controller] - worker_handle_dict = ray.get(controller._all_running_replicas.remote()) - for _, replica_info_list in worker_handle_dict.items(): - for replica_info in replica_info_list: - all_handles.append(replica_info.actor_handle) + replica_dict = ray.get(controller._all_running_replicas.remote()) + for deployment_name, replica_info_list in replica_dict.items(): + if 
deployment_name not in self.sanctuary: + for replica_info in replica_info_list: + all_handles.append(replica_info.actor_handle) return all_handles - def run(self): - while True: - chosen = random.choice(self._get_all_serve_actors()) - print(f"Killing {chosen}") - ray.kill(chosen, no_restart=False) - time.sleep(self.kill_period_s) - class RandomTest: def __init__(self, max_deployments=1): @@ -90,8 +102,11 @@ def __init__(self, max_deployments=1): (self.verify_deployment, 4), ] self.deployments = [] + self.random_killer = RandomKiller.remote() + for _ in range(max_deployments): self.create_deployment() + self.random_killer.run.remote() def create_deployment(self): if len(self.deployments) == self.max_deployments: @@ -104,10 +119,14 @@ def create_deployment(self): def handler(self, *args): return new_name - handler.deploy() + ray.get(self.random_killer.spare.remote(new_name)) + + handler.deploy(_blocking=True) self.deployments.append(new_name) + ray.get(self.random_killer.stop_spare.remote(new_name)) + def verify_deployment(self): deployment = random.choice(self.deployments) for _ in range(100): @@ -154,6 +173,4 @@ def run(self): tester = RandomTest(max_deployments=NUM_NODES * CPUS_PER_NODE) -random_killer = RandomKiller.remote() -random_killer.run.remote() tester.run() From 0c68ba46d770cbd56a7edabbf332d8ab1beffa1d Mon Sep 17 00:00:00 2001 From: Sihan Wang Date: Thu, 26 Jan 2023 07:44:25 -0800 Subject: [PATCH 004/267] [Serve] Serve python API to support multi application (#31589) - Python API for multi applications. serve.run() & serve.delete() --- .../ray/serve/api/ServeControllerClient.java | 20 +- python/ray/serve/BUILD | 10 +- python/ray/serve/__init__.py | 2 + .../ray/serve/_private/application_state.py | 224 ++++++++++++++++++ python/ray/serve/_private/client.py | 51 +++- python/ray/serve/_private/common.py | 9 +- .../serve/_private/deployment_graph_build.py | 15 +- python/ray/serve/_private/deployment_state.py | 12 +- python/ray/serve/api.py | 41 +++- python/ray/serve/controller.py | 194 ++++++++------- python/ray/serve/schema.py | 16 ++ python/ray/serve/tests/test_api.py | 108 +++++++++ .../ray/serve/tests/test_application_state.py | 136 +++++++++++ python/ray/serve/tests/test_schema.py | 27 ++- src/ray/protobuf/serve.proto | 3 + 15 files changed, 739 insertions(+), 129 deletions(-) create mode 100644 python/ray/serve/_private/application_state.py create mode 100644 python/ray/serve/tests/test_application_state.py diff --git a/java/serve/src/main/java/io/ray/serve/api/ServeControllerClient.java b/java/serve/src/main/java/io/ray/serve/api/ServeControllerClient.java index f1d8a4e51729..39c366f1ba66 100644 --- a/java/serve/src/main/java/io/ray/serve/api/ServeControllerClient.java +++ b/java/serve/src/main/java/io/ray/serve/api/ServeControllerClient.java @@ -369,19 +369,13 @@ private StatusOverview getServeStatus() { } private DeploymentStatusInfo getDeploymentStatus(String name) { - StatusOverview statusOverview = getServeStatus(); - if (statusOverview == null - || statusOverview.getDeploymentStatuses() == null - || statusOverview.getDeploymentStatuses().getDeploymentStatusInfosList() == null) { - return null; - } - for (DeploymentStatusInfo deploymentStatusInfo : - statusOverview.getDeploymentStatuses().getDeploymentStatusInfosList()) { - if (StringUtils.equals(name, deploymentStatusInfo.getName())) { - return deploymentStatusInfo; - } - } - return null; + return ServeProtoUtil.bytesToProto( + (byte[]) + ((PyActorHandle) controller) + .task(PyActorMethod.of("get_deployment_status"), 
name) + .remote() + .get(), + DeploymentStatusInfo::parseFrom); } public BaseActorHandle getController() { diff --git a/python/ray/serve/BUILD b/python/ray/serve/BUILD index 68935517a11b..c01a7f3a6b3d 100644 --- a/python/ray/serve/BUILD +++ b/python/ray/serve/BUILD @@ -19,7 +19,7 @@ filegroup( py_test( name = "test_api", - size = "medium", + size = "large", srcs = serve_tests_srcs, tags = ["exclusive", "team:serve"], deps = [":serve_lib"], @@ -33,6 +33,14 @@ py_test( deps = [":serve_lib"], ) +py_test( + name = "test_application_state", + size = "small", + srcs = serve_tests_srcs, + tags = ["exclusive", "team:serve"], + deps = [":serve_lib"], +) + py_test( name = "test_deploy", size = "large", diff --git a/python/ray/serve/__init__.py b/python/ray/serve/__init__.py index 5e997ee09907..23c0eac007c4 100644 --- a/python/ray/serve/__init__.py +++ b/python/ray/serve/__init__.py @@ -10,6 +10,7 @@ run, shutdown, start, + delete, ) from ray.serve.air_integrations import PredictorDeployment from ray.serve.batching import batch @@ -38,4 +39,5 @@ "list_deployments", "run", "PredictorDeployment", + "delete", ] diff --git a/python/ray/serve/_private/application_state.py b/python/ray/serve/_private/application_state.py new file mode 100644 index 000000000000..636b7bba9f51 --- /dev/null +++ b/python/ray/serve/_private/application_state.py @@ -0,0 +1,224 @@ +import ray +import traceback +from typing import Dict, List +from ray.serve._private.common import ApplicationStatus +from ray.serve._private.deployment_state import DeploymentStateManager +from ray.serve._private.common import ( + DeploymentStatus, + DeploymentStatusInfo, + ApplicationStatusInfo, +) +import time +from ray.exceptions import RayTaskError, RuntimeEnvSetupError +import logging +from ray.serve._private.constants import SERVE_LOGGER_NAME +from ray.types import ObjectRef + +logger = logging.getLogger(SERVE_LOGGER_NAME) + + +class ApplicationState: + """Manage single application states with all operations""" + + def __init__( + self, + name: str, + deployment_state_manager: DeploymentStateManager, + deployment_params: List[Dict] = None, + deploy_obj_ref: ObjectRef = None, + deployment_time: float = 0, + ): + """ + Args: + name: application name + deployment_state_manager: deployment state manager which is used for + fetching deployment information + deployment_params: all deployment parameters to deploy. + deploy_obj_ref: Task ObjRef of deploying application. + deployment_time: Deployment timestamp + """ + if deploy_obj_ref: + self.status: ApplicationStatus = ApplicationStatus.DEPLOYING + else: + self.status: ApplicationStatus = ApplicationStatus.NOT_STARTED + self.name = name + self.deployment_params = deployment_params + self.to_be_deleted = False + self.deployment_state_manager = deployment_state_manager + if deployment_time: + self.deployment_timestamp = deployment_time + else: + self.deployment_timestamp = time.time() + self.deploy_obj_ref = deploy_obj_ref + self.app_msg = "" + + def delete(self): + """Delete the application""" + self.status = ApplicationStatus.DELETING + + def deploy(self): + """Deploy the application""" + self.status = ApplicationStatus.DEPLOYING + + def update(self): + """Update the application status, maintain the ApplicationStatus. + This method should be idempotent. + + Status: + DEPLOYING -> RUNNING: All deployments are healthy. + DEPLOYING -> DEPLOY_FAILED: Not all deployments are healthy. + DELETING: Mark to_be_deleted as True when all deployments are gone. 
+ """ + + if self.to_be_deleted: + return + + if self.status == ApplicationStatus.DELETING: + mark_delete = True + for name in self.get_all_deployments(): + if self.deployment_state_manager.get_deployment(name): + mark_delete = False + break + self.to_be_deleted = mark_delete + return + + if self.status == ApplicationStatus.DEPLOYING: + if self.deploy_obj_ref: + finished, pending = ray.wait([self.deploy_obj_ref], timeout=0) + if pending: + return + try: + ray.get(finished[0]) + except RayTaskError: + self.status = ApplicationStatus.DEPLOY_FAILED + self.app_msg = f"Deployment failed:\n{traceback.format_exc()}" + self.deploy_obj_ref = None + return + except RuntimeEnvSetupError: + self.status = ApplicationStatus.DEPLOY_FAILED + self.app_msg = ( + f"Runtime env setup failed:\n{traceback.format_exc()}" + ) + self.deploy_obj_ref = None + return + deployments_statuses = ( + self.deployment_state_manager.get_deployment_statuses( + self.get_all_deployments() + ) + ) + num_health_deployments = 0 + for deployment_status in deployments_statuses: + if deployment_status.status == DeploymentStatus.UNHEALTHY: + self.status = ApplicationStatus.DEPLOY_FAILED + return + if deployment_status.status == DeploymentStatus.HEALTHY: + num_health_deployments += 1 + if num_health_deployments == len(deployments_statuses): + self.status = ApplicationStatus.RUNNING + + def get_all_deployments(self) -> List[str]: + """Return all deployments name from the application""" + if self.deployment_params is None: + return [] + return [params["name"] for params in self.deployment_params] + + def get_deployments_statuses(self) -> List[DeploymentStatusInfo]: + """Return all deployment status information""" + return self.deployment_state_manager.get_deployment_statuses( + self.get_all_deployments() + ) + + def get_application_status_info(self) -> ApplicationStatusInfo: + """Return the application status information""" + return ApplicationStatusInfo( + self.status, + message=self.app_msg, + deployment_timestamp=self.deployment_timestamp, + ) + + +class ApplicationStateManager: + def __init__(self, deployment_state_manager): + self.deployment_state_manager = deployment_state_manager + self._application_states: Dict[str, ApplicationState] = {} + + def delete_application(self, name: str): + """Delete application by name""" + if name not in self._application_states: + return + self._application_states[name].delete() + + def deploy_application(self, name: str, deployment_args: List[Dict]): + """Deploy single application + + Args: + name: application name + deployment_args: deployment args + """ + if name in self._application_states: + self._application_states[name].deployment_params = deployment_args + else: + self._application_states[name] = ApplicationState( + name, + self.deployment_state_manager, + deployment_args, + ) + self._application_states[name].deploy() + + def get_deployments(self, app_name: str) -> List[str]: + """Return all deployment names by app name""" + if app_name not in self._application_states: + return [] + return self._application_states[app_name].get_all_deployments() + + def get_deployments_statuses(self, app_name: str) -> List[DeploymentStatusInfo]: + """Return all deployment statuses by app name""" + if app_name not in self._application_states: + return [] + return self._application_states[app_name].get_deployments_statuses() + + def get_app_status(self, name: str) -> ApplicationStatusInfo: + if name not in self._application_states: + return ApplicationStatusInfo( + ApplicationStatus.NOT_STARTED, + 
message=f"Application {name} doesn't exist", + deployment_timestamp=0, + ) + return self._application_states[name].get_application_status_info() + + def create_application_state( + self, name: str, deploy_obj_ref: ObjectRef, deployment_time: float = 0 + ): + """Create application state + This is used for holding the deploy_obj_ref which is created by run_graph method + """ + if ( + name in self._application_states + and self._application_states[name].deploy_obj_ref + ): + logger.info( + f"Received new config deployment for {name} request. Cancelling " + "previous request." + ) + ray.cancel(self._application_states[name].deploy_obj_ref) + self._application_states[name] = ApplicationState( + name, + self.deployment_state_manager, + deploy_obj_ref=deploy_obj_ref, + deployment_time=deployment_time, + ) + + def get_deployment_timestamp(self, name: str) -> float: + if name not in self._application_states: + return -1 + return self._application_states[name].deployment_timestamp + + def update(self): + """Update each application state""" + apps_to_be_deleted = [] + for name, app in self._application_states.items(): + app.update() + if app.to_be_deleted: + apps_to_be_deleted.append(name) + for app_name in apps_to_be_deleted: + del self._application_states[app_name] diff --git a/python/ray/serve/_private/client.py b/python/ray/serve/_private/client.py index 36cfad1e45a5..653bbf5c254a 100644 --- a/python/ray/serve/_private/client.py +++ b/python/ray/serve/_private/client.py @@ -12,6 +12,7 @@ DeploymentStatus, StatusOverview, ApplicationStatus, + DeploymentStatusInfo, ) from ray.serve.config import DeploymentConfig, HTTPOptions, ReplicaConfig from ray.serve._private.constants import ( @@ -23,6 +24,9 @@ from ray.serve.exceptions import RayServeException from ray.serve.generated.serve_pb2 import DeploymentRoute, DeploymentRouteList from ray.serve.generated.serve_pb2 import StatusOverview as StatusOverviewProto +from ray.serve.generated.serve_pb2 import ( + DeploymentStatusInfo as DeploymentStatusInfoProto, +) from ray.serve.handle import RayServeHandle, RayServeSyncHandle from ray.serve.schema import ServeApplicationSchema @@ -159,14 +163,18 @@ def _wait_for_deployment_healthy(self, name: str, timeout_s: int = -1): start = time.time() while time.time() - start < timeout_s or timeout_s < 0: - status = self.get_serve_status().get_deployment_status(name) + status_bytes = ray.get(self._controller.get_deployment_status.remote(name)) - if status is None: + if status_bytes is None: raise RuntimeError( f"Waiting for deployment {name} to be HEALTHY, " "but deployment doesn't exist." ) + status = DeploymentStatusInfo.from_proto( + DeploymentStatusInfoProto.FromString(status_bytes) + ) + if status.status == DeploymentStatus.HEALTHY: break elif status.status == DeploymentStatus.UNHEALTHY: @@ -194,9 +202,14 @@ def _wait_for_deployment_deleted(self, name: str, timeout_s: int = 60): """ start = time.time() while time.time() - start < timeout_s: - curr_status = self.get_serve_status().get_deployment_status(name) - if curr_status is None: + curr_status_bytes = ray.get( + self._controller.get_deployment_status.remote(name) + ) + if curr_status_bytes is None: break + curr_status = DeploymentStatusInfo.from_proto( + DeploymentStatusInfoProto.FromString(curr_status_bytes) + ) logger.debug( f"Waiting for {name} to be deleted, current status: {curr_status}." 
) @@ -241,6 +254,7 @@ def deploy( @_ensure_connected def deploy_group( self, + name, deployments: List[Dict], _blocking: bool = True, remove_past_deployments: bool = True, @@ -262,7 +276,7 @@ def deploy_group( ) updating_list = ray.get( - self._controller.deploy_group.remote(deployment_args_list) + self._controller.deploy_group.remote(name, deployment_args_list) ) tags = [] @@ -312,6 +326,29 @@ def deploy_app( f"Serve application isn't running after {timeout_s}s." ) + @_ensure_connected + def delete_apps(self, names: List[str], blocking: bool = True): + logger.info(f"Deleting app {names}") + self._controller.delete_apps.remote(names) + if blocking: + start = time.time() + while time.time() - start < 60: + curr_statuses_bytes = ray.get( + self._controller.get_serve_statuses.remote(names) + ) + all_deleted = True + for cur_status_bytes in curr_statuses_bytes: + cur_status = StatusOverview.from_proto( + StatusOverviewProto.FromString(cur_status_bytes) + ) + if cur_status.app_status.status != ApplicationStatus.NOT_STARTED: + all_deleted = False + if all_deleted: + return + time.sleep(CLIENT_POLLING_INTERVAL_S) + else: + raise TimeoutError(f"Deployment {names} wasn't deleted after 60s.") + @_ensure_connected def delete_deployments(self, names: Iterable[str], blocking: bool = True) -> None: ray.get(self._controller.delete_deployments.remote(names)) @@ -348,9 +385,9 @@ def get_app_config(self) -> Dict: return ray.get(self._controller.get_app_config.remote()) @_ensure_connected - def get_serve_status(self) -> StatusOverview: + def get_serve_status(self, name: str = "") -> StatusOverview: proto = StatusOverviewProto.FromString( - ray.get(self._controller.get_serve_status.remote()) + ray.get(self._controller.get_serve_status.remote(name)) ) return StatusOverview.from_proto(proto) diff --git a/python/ray/serve/_private/common.py b/python/ray/serve/_private/common.py index 439bec125495..faa7c422cdbb 100644 --- a/python/ray/serve/_private/common.py +++ b/python/ray/serve/_private/common.py @@ -33,6 +33,7 @@ class ApplicationStatus(str, Enum): DEPLOYING = "DEPLOYING" RUNNING = "RUNNING" DEPLOY_FAILED = "DEPLOY_FAILED" + DELETING = "DELETING" @dataclass(eq=True) @@ -92,6 +93,7 @@ def from_proto(cls, proto: DeploymentStatusInfoProto): @dataclass(eq=True) class StatusOverview: app_status: ApplicationStatusInfo + name: str = "" deployment_statuses: List[DeploymentStatusInfo] = field(default_factory=list) def debug_string(self): @@ -131,6 +133,7 @@ def to_proto(self): # Return protobuf encapsulating application and deployment protos return StatusOverviewProto( + name=self.name, app_status=app_status_proto, deployment_statuses=deployment_status_proto_list, ) @@ -147,7 +150,11 @@ def from_proto(cls, proto: StatusOverviewProto) -> "StatusOverview": deployment_statuses.append(DeploymentStatusInfo.from_proto(info_proto)) # Recreate StatusInfo - return cls(app_status=app_status, deployment_statuses=deployment_statuses) + return cls( + app_status=app_status, + deployment_statuses=deployment_statuses, + name=proto.name, + ) HEALTH_CHECK_CONCURRENCY_GROUP = "health_check" diff --git a/python/ray/serve/_private/deployment_graph_build.py b/python/ray/serve/_private/deployment_graph_build.py index 4a812bd39a3b..a75852f3e75d 100644 --- a/python/ray/serve/_private/deployment_graph_build.py +++ b/python/ray/serve/_private/deployment_graph_build.py @@ -32,7 +32,7 @@ from ray.experimental.gradio_utils import type_to_string -def build(ray_dag_root_node: DAGNode) -> List[Deployment]: +def build(ray_dag_root_node: DAGNode, 
name: str = None) -> List[Deployment]: """Do all the DAG transformation, extraction and generation needed to produce a runnable and deployable serve pipeline application from a valid DAG authored with Ray DAG API. @@ -64,6 +64,8 @@ def build(ray_dag_root_node: DAGNode) -> List[Deployment]: ray_dag_root_node: DAGNode acting as root of a Ray authored DAG. It should be executable via `ray_dag_root_node.execute(user_input)` and should have `InputNode` in it. + name: Application name,. If provided, formatting all the deployment name to + {name}_{deployment_name} Returns: deployments: All deployments needed for an e2e runnable serve pipeline, @@ -86,7 +88,7 @@ def build(ray_dag_root_node: DAGNode) -> List[Deployment]: """ with _DAGNodeNameGenerator() as node_name_generator: serve_root_dag = ray_dag_root_node.apply_recursive( - lambda node: transform_ray_dag_to_serve_dag(node, node_name_generator) + lambda node: transform_ray_dag_to_serve_dag(node, node_name_generator, name) ) deployments = extract_deployments_from_serve_dag(serve_root_dag) @@ -133,11 +135,12 @@ def get_and_validate_ingress_deployment( def transform_ray_dag_to_serve_dag( - dag_node: DAGNode, node_name_generator: _DAGNodeNameGenerator + dag_node: DAGNode, node_name_generator: _DAGNodeNameGenerator, name: str = None ): """ Transform a Ray DAG to a Serve DAG. Map ClassNode to DeploymentNode with ray decorated body passed in, and ClassMethodNode to DeploymentMethodNode. + When provided name, all Deployment name will {name}_{deployment_name} """ if isinstance(dag_node, ClassNode): deployment_name = node_name_generator.get_node_name(dag_node) @@ -195,6 +198,9 @@ def replace_with_handle(node): ): deployment_name = deployment_shell.name + if name: + deployment_name = f"{name}_{deployment_name}" + # Set the route prefix, prefer the one user supplied, # otherwise set it to /deployment_name if ( @@ -257,6 +263,9 @@ def replace_with_handle(node): dag_node._body.__annotations__["return"] ) + if name: + deployment_name = f"{name}_{deployment_name}" + return DeploymentFunctionNode( dag_node._body, deployment_name, diff --git a/python/ray/serve/_private/deployment_state.py b/python/ray/serve/_private/deployment_state.py index ba7cae52964c..9db5d6256de9 100644 --- a/python/ray/serve/_private/deployment_state.py +++ b/python/ray/serve/_private/deployment_state.py @@ -1979,10 +1979,14 @@ def get_deployment( else: return None - def get_deployment_statuses(self) -> List[DeploymentStatusInfo]: - return list( - map(lambda state: state.curr_status_info, self._deployment_states.values()) - ) + def get_deployment_statuses( + self, names: List[str] = None + ) -> List[DeploymentStatusInfo]: + statuses = [] + for name, state in self._deployment_states.items(): + if not names or name in names: + statuses.append(state.curr_status_info) + return statuses def deploy(self, deployment_name: str, deployment_info: DeploymentInfo) -> bool: """Deploy the deployment. diff --git a/python/ray/serve/api.py b/python/ray/serve/api.py index 7ae5999b4e38..714611c0e83e 100644 --- a/python/ray/serve/api.py +++ b/python/ray/serve/api.py @@ -457,6 +457,8 @@ def run( _blocking: bool = True, host: str = DEFAULT_HTTP_HOST, port: int = DEFAULT_HTTP_PORT, + name: str = "", + route_prefix: str = "/", ) -> Optional[RayServeHandle]: """Run a Serve application and return a ServeHandle to the ingress. @@ -473,6 +475,11 @@ def run( "127.0.0.1". To expose Serve publicly, you probably want to set this to "0.0.0.0". port: Port for HTTP server. Defaults to 8000. + name: Application name. 
If not provided, this will be the only + application running on the cluster (it will delete all others). + route_prefix: Route prefix for HTTP requests. If not provided, it will use + route_prefix of the ingress deployment. By default, the ingress route + prefix is '/'. Returns: RayServeHandle: A regular ray serve handle that can be called by user @@ -488,14 +495,17 @@ def run( if isinstance(target, Application): deployments = list(target.deployments.values()) + if name: + for deployment in deployments: + deployment._name = f"{name}_{deployment._name}" ingress = target.ingress # Each DAG should always provide a valid Driver ClassNode elif isinstance(target, ClassNode): - deployments = pipeline_build(target) + deployments = pipeline_build(target, name) ingress = get_and_validate_ingress_deployment(deployments) # Special case where user is doing single function serve.run(func.bind()) elif isinstance(target, FunctionNode): - deployments = pipeline_build(target) + deployments = pipeline_build(target, name) ingress = get_and_validate_ingress_deployment(deployments) if len(deployments) != 1: raise ValueError( @@ -517,9 +527,18 @@ def run( f"Got unexpected type {type(target)} instead." ) + # when name provided, keep all existing applications + # otherwise, delete all of them. + remove_past_deployments = True + if name: + remove_past_deployments = False + parameter_group = [] for deployment in deployments: + # Overwrite route prefix + if route_prefix != "/" and deployment._route_prefix: + deployment._route_prefix = route_prefix deployment_parameters = { "name": deployment._name, "func_or_class": deployment._func_or_class, @@ -534,7 +553,10 @@ def run( } parameter_group.append(deployment_parameters) client.deploy_group( - parameter_group, _blocking=_blocking, remove_past_deployments=True + name, + parameter_group, + _blocking=_blocking, + remove_past_deployments=remove_past_deployments, ) if ingress is not None: @@ -574,3 +596,16 @@ def build(target: Union[ClassNode, FunctionNode]) -> Application: # TODO(edoakes): this should accept host and port, but we don't # currently support them in the REST API. return Application(pipeline_build(target)) + + +@PublicAPI(stability="alpha") +def delete(name: str, _blocking: bool = True): + """Delete an app by its name + + Deletes the app with all corresponding deployments. + + Args: + name: the name of app to delete. 
+ """ + client = get_global_client() + client.delete_apps([name], blocking=_blocking) diff --git a/python/ray/serve/controller.py b/python/ray/serve/controller.py index a05a47429e2c..0d4d13734497 100644 --- a/python/ray/serve/controller.py +++ b/python/ray/serve/controller.py @@ -4,7 +4,6 @@ import os import pickle import time -import traceback from collections import defaultdict from typing import Any, Dict, Iterable, List, Optional, Tuple, Union @@ -15,12 +14,9 @@ ) from ray.util.scheduling_strategies import NodeAffinitySchedulingStrategy from ray.actor import ActorHandle -from ray.exceptions import RayTaskError, RuntimeEnvSetupError from ray._private.gcs_utils import GcsClient from ray.serve._private.autoscaling_policy import BasicAutoscalingPolicy from ray.serve._private.common import ( - ApplicationStatus, - ApplicationStatusInfo, DeploymentInfo, EndpointInfo, EndpointTag, @@ -48,7 +44,7 @@ override_runtime_envs_except_env_vars, get_random_letters, ) -from ray.types import ObjectRef +from ray.serve._private.application_state import ApplicationStateManager logger = logging.getLogger(SERVE_LOGGER_NAME) @@ -146,11 +142,10 @@ async def __init__( all_serve_actor_names, ) - # Reference to Ray task executing most recent deployment request - self.config_deployment_request_ref: ObjectRef = None - - # Unix timestamp of latest config deployment request. Defaults to 0. - self.deployment_timestamp = 0 + # Manage all applications' state + self.application_state_manager = ApplicationStateManager( + self.deployment_state_manager + ) run_background_task(self.run_control_loop()) @@ -255,6 +250,10 @@ async def run_control_loop(self) -> None: self.deployment_state_manager.update() except Exception: logger.exception("Exception updating deployment state.") + try: + self.application_state_manager.update() + except Exception: + logger.exception("Exception updating application state.") try: self._put_serve_snapshot() @@ -308,8 +307,12 @@ def _put_serve_snapshot(self) -> None: def _recover_config_from_checkpoint(self): checkpoint = self.kv_store.get(CONFIG_CHECKPOINT_KEY) if checkpoint is not None: - self.deployment_timestamp, config, _ = pickle.loads(checkpoint) - self.deploy_app(ServeApplicationSchema.parse_obj(config), update_time=False) + config_checkpoints_dict = pickle.loads(checkpoint) + for name in config_checkpoints_dict: + deployment_time, config, _ = config_checkpoints_dict[name] + self.deploy_app( + ServeApplicationSchema.parse_obj(config), deployment_time + ) def _all_running_replicas(self) -> Dict[str, List[RunningReplicaInfo]]: """Used for testing. @@ -415,7 +418,7 @@ def deploy( return updating - def deploy_group(self, deployment_args_list: List[Dict]) -> List[bool]: + def deploy_group(self, name: str, deployment_args_list: List[Dict]) -> List[bool]: """ Takes in a list of dictionaries that contain keyword arguments for the controller's deploy() function. Calls deploy on all the argument @@ -423,66 +426,77 @@ def deploy_group(self, deployment_args_list: List[Dict]) -> List[bool]: group of deployments. """ - return [self.deploy(**args) for args in deployment_args_list] + deployments_success = [self.deploy(**args) for args in deployment_args_list] + self.application_state_manager.deploy_application(name, deployment_args_list) + return deployments_success def deploy_app( - self, config: ServeApplicationSchema, update_time: bool = True + self, + config: ServeApplicationSchema, + deployment_time: float = 0, ) -> None: """Kicks off a task that deploys a Serve application. 
- Cancels any previous in-progress task that is deploying a Serve - application. + Cancels in-progress task that is deploying a Serve + application with same name. Args: config: Contains the following: + name: Application name. If not provided, it is empty string. import_path: Serve deployment graph's import path runtime_env: runtime_env to run the deployment graph in deployment_override_options: Dictionaries that contain argument-value options that can be passed directly into a set_options() call. Overrides deployment options set in the graph's code itself. - update_time: Whether to update the deployment_timestamp. + deployment_time: set deployment_timestamp. If not provided, time.time() is + used to indicate the deployment time. """ - - if update_time: - self.deployment_timestamp = time.time() - config_dict = config.dict(exclude_unset=True) # Compare new config options with old ones and set versions of new deployments - config_checkpoint = self.kv_store.get(CONFIG_CHECKPOINT_KEY) - - if config_checkpoint is not None: - _, last_config_dict, last_version_dict = pickle.loads(config_checkpoint) + config_checkpoints = self.kv_store.get(CONFIG_CHECKPOINT_KEY) + if config_checkpoints is None: + config_checkpoints_dict = {} + else: + config_checkpoints_dict = pickle.loads(config_checkpoints) + if config.name in config_checkpoints_dict: + _, last_config_dict, last_version_dict = config_checkpoints_dict[ + config.name + ] updated_version_dict = _generate_deployment_config_versions( config_dict, last_config_dict, last_version_dict ) else: updated_version_dict = _generate_deployment_config_versions(config_dict) + deployment_override_options = config_dict.get("deployments", []) + + if not deployment_time: + deployment_time = time.time() + + config_checkpoints_dict[config.name] = ( + deployment_time, + config_dict, + updated_version_dict, + ) self.kv_store.put( CONFIG_CHECKPOINT_KEY, - pickle.dumps( - (self.deployment_timestamp, config_dict, updated_version_dict) - ), + pickle.dumps(config_checkpoints_dict), ) - deployment_override_options = config_dict.get("deployments", []) - - if self.config_deployment_request_ref is not None: - ray.cancel(self.config_deployment_request_ref) - logger.info( - "Received new config deployment request. Cancelling " - "previous request." - ) - - self.config_deployment_request_ref = run_graph.options( - runtime_env=config.runtime_env - ).remote( + deploy_obj_ref = run_graph.options(runtime_env=config.runtime_env).remote( config.import_path, config.runtime_env, deployment_override_options, updated_version_dict, + config.name, + config_dict.get("route_prefix", "/"), + ) + self.application_state_manager.create_application_state( + config.name, + deploy_obj_ref=deploy_obj_ref, + deployment_time=deployment_time, ) def delete_deployment(self, name: str): @@ -571,53 +585,62 @@ def list_deployments(self, include_deleted: Optional[bool] = False) -> bytes: ) return deployment_route_list.SerializeToString() - async def get_serve_status(self) -> bytes: - - serve_app_status = ApplicationStatus.RUNNING - serve_app_message = "" - deployment_timestamp = self.deployment_timestamp - - if self.config_deployment_request_ref: - finished, pending = ray.wait( - [self.config_deployment_request_ref], timeout=0 - ) + def get_serve_status(self, name: str = "") -> bytes: + """Return application status + Args: + name: application name. If application name doesn't exist, app_status + is NOT_STARTED. 
+ """ - if pending: - serve_app_status = ApplicationStatus.DEPLOYING - else: - try: - await finished[0] - except Exception as e: - serve_app_status = ApplicationStatus.DEPLOY_FAILED - tb = traceback.format_exc() - - if isinstance(e, RayTaskError): - serve_app_message = f"Deployment failed:\n{tb}" - elif isinstance(e, RuntimeEnvSetupError): - serve_app_message = f"Runtime env setup failed:\n{tb}" - else: - serve_app_message = f"Unknown error occurred:\n{tb}" - - app_status = ApplicationStatusInfo( - serve_app_status, serve_app_message, deployment_timestamp + app_status = self.application_state_manager.get_app_status(name) + deployment_statuses = self.application_state_manager.get_deployments_statuses( + name ) - deployment_statuses = self.deployment_state_manager.get_deployment_statuses() - status_info = StatusOverview( + name=name, app_status=app_status, deployment_statuses=deployment_statuses, ) - return status_info.to_proto().SerializeToString() - def get_app_config(self) -> Dict: + def get_serve_statuses(self, names: List[str]) -> List[bytes]: + statuses = [] + for name in names: + statuses.append(self.get_serve_status(name)) + return statuses + + def get_app_config(self, name: str = "") -> Dict: checkpoint = self.kv_store.get(CONFIG_CHECKPOINT_KEY) if checkpoint is None: return ServeApplicationSchema.get_empty_schema_dict() else: - _, config, _ = pickle.loads(checkpoint) + config_checkpoints_dict = pickle.loads(checkpoint) + if name not in config_checkpoints_dict: + return ServeApplicationSchema.get_empty_schema_dict() + _, config, _ = config_checkpoints_dict[name] + return config + def get_deployment_status(self, name: str) -> Union[None, bytes]: + """Get deployment status by deployment name""" + status = self.deployment_state_manager.get_deployment_statuses([name]) + if not status: + return None + return status[0].to_proto().SerializeToString() + + def delete_apps(self, names: Iterable[str]): + """Delete applications based on names + + During deletion, the application status is DELETING + """ + deployments_to_delete = [] + for name in names: + deployments_to_delete.extend( + self.application_state_manager.get_deployments(name) + ) + self.application_state_manager.delete_application(name) + self.delete_deployments(deployments_to_delete) + def _generate_deployment_config_versions( new_config: Dict, @@ -710,9 +733,11 @@ def run_graph( graph_env: Dict, deployment_override_options: List[Dict], deployment_versions: Dict, + name: str = "", + route_prefix: str = "/", ): """ - Deploys a Serve application to the controller's Ray cluster. + Build application object from user config Args: import_path: Serve deployment graph's import path @@ -722,6 +747,9 @@ def run_graph( deployment_versions: Versions of each deployment, each of which is the same as the last deployment if it is a config update or a new randomly generated version if it is a code update + name: application name. If specified, application will be deployed + without removing existing applications. + route_prefix: route_prefix. Define the route path for the application. 
""" try: from ray import serve @@ -733,7 +761,7 @@ def run_graph( # Override options for each deployment for options in deployment_override_options: - name = options["name"] + deployment_name = options["name"] # Merge graph-level and deployment-level runtime_envs if "ray_actor_options" in options: @@ -742,23 +770,21 @@ def run_graph( else: # Otherwise, get options from graph code (and default to {} if code # sets options to None) - ray_actor_options = app.deployments[name].ray_actor_options or {} - + ray_actor_options = ( + app.deployments[deployment_name].ray_actor_options or {} + ) deployment_env = ray_actor_options.get("runtime_env", {}) merged_env = override_runtime_envs_except_env_vars( graph_env, deployment_env ) - ray_actor_options.update({"runtime_env": merged_env}) options["ray_actor_options"] = ray_actor_options - - options["version"] = deployment_versions[name] - + options["version"] = deployment_versions[deployment_name] # Update the deployment's options - app.deployments[name].set_options(**options, _internal=True) + app.deployments[deployment_name].set_options(**options, _internal=True) # Run the graph locally on the cluster - serve.run(app) + serve.run(app, name=name, route_prefix=route_prefix) except KeyboardInterrupt: # Error is raised when this task is canceled with ray.cancel(), which # happens when deploy_app() is called. diff --git a/python/ray/serve/schema.py b/python/ray/serve/schema.py index 2a7e5f86c2ca..79f1e347bc5e 100644 --- a/python/ray/serve/schema.py +++ b/python/ray/serve/schema.py @@ -242,6 +242,20 @@ def get_user_configured_option_names(self) -> Set[str]: @PublicAPI(stability="beta") class ServeApplicationSchema(BaseModel, extra=Extra.forbid): + name: str = Field( + default="", + description=( + "Application name, the name should be unique within the serve instance" + ), + ) + route_prefix: str = Field( + default="/", + description=( + "Route prefix for HTTP requests. If not provided, it will use" + "route_prefix of the ingress deployment. By default, the ingress route" + "prefix is '/'." 
+ ), + ) import_path: str = Field( default=None, description=( @@ -398,6 +412,7 @@ def kubernetes_dict(self, **kwargs) -> Dict: @PublicAPI(stability="beta") class ServeStatusSchema(BaseModel, extra=Extra.forbid): + name: str = Field(description="Application name", default="") app_status: ApplicationStatusInfo = Field( ..., description=( @@ -438,6 +453,7 @@ def get_empty_schema_dict() -> Dict: def serve_status_to_schema(serve_status: StatusOverview) -> ServeStatusSchema: return ServeStatusSchema( + name=serve_status.name, app_status=serve_status.app_status, deployment_statuses=serve_status.deployment_statuses, ) diff --git a/python/ray/serve/tests/test_api.py b/python/ray/serve/tests/test_api.py index ebb009293d3e..9acbc2b2c2ad 100644 --- a/python/ray/serve/tests/test_api.py +++ b/python/ray/serve/tests/test_api.py @@ -5,11 +5,13 @@ import requests import pytest import starlette.responses +from fastapi import FastAPI import ray from ray import serve from ray._private.test_utils import SignalActor, wait_for_condition from ray.serve.application import Application +from ray.serve.drivers import DAGDriver @serve.deployment() @@ -476,6 +478,112 @@ def f(): f.set_options(max_concurrent_queries=-4) +def test_deploy_application(serve_instance): + """Test deploy multiple applications""" + + @serve.deployment + def f(): + return "got f" + + @serve.deployment + def g(): + return "got g" + + @serve.deployment(route_prefix="/my_prefix") + def h(): + return "got h" + + @serve.deployment + class Model1: + def __call__(self): + return "got model1" + + app = FastAPI() + + @serve.deployment(route_prefix="/hello") + @serve.ingress(app) + class MyFastAPIDeployment: + @app.get("/") + def root(self): + return "Hello, world!" + + # Test function deployment with app name + f_handle = serve.run(f.bind(), name="app_f") + assert ray.get(f_handle.remote()) == "got f" + assert requests.get("http://127.0.0.1:8000/").text == "got f" + + # Test function deployment with app name and route_prefix + g_handle = serve.run(g.bind(), name="app_g", route_prefix="/app_g") + assert ray.get(g_handle.remote()) == "got g" + assert requests.get("http://127.0.0.1:8000/app_g").text == "got g" + + # Test function deployment with app name and route_prefix set in deployment + # decorator + h_handle = serve.run(h.bind(), name="app_h") + assert ray.get(h_handle.remote()) == "got h" + assert requests.get("http://127.0.0.1:8000/my_prefix").text == "got h" + + # Test deployment graph + graph_handle = serve.run( + DAGDriver.bind(Model1.bind()), name="graph", route_prefix="/my_graph" + ) + assert ray.get(graph_handle.predict.remote()) == "got model1" + assert requests.get("http://127.0.0.1:8000/my_graph").text == '"got model1"' + + # Test FastAPI + serve.run(MyFastAPIDeployment.bind(), name="FastAPI") + assert requests.get("http://127.0.0.1:8000/hello").text == '"Hello, world!"' + + +def test_delete_application(serve_instance): + """Test delete single application""" + + @serve.deployment + def f(): + return "got f" + + @serve.deployment + def g(): + return "got g" + + f_handle = serve.run(f.bind(), name="app_f") + g_handle = serve.run(g.bind(), name="app_g", route_prefix="/app_g") + assert ray.get(f_handle.remote()) == "got f" + assert requests.get("http://127.0.0.1:8000/").text == "got f" + + serve.delete("app_f") + assert "Path '/' not found" in requests.get("http://127.0.0.1:8000/").text + + # delete again, no exception & crash expected. 
+ serve.delete("app_f") + + # make sure no affect to app_g + assert ray.get(g_handle.remote()) == "got g" + assert requests.get("http://127.0.0.1:8000/app_g").text == "got g" + + +def test_deployment_name_with_app_name(): + """Test replica name with app name as prefix""" + + controller = serve.context._global_client._controller + + @serve.deployment + def g(): + return "got g" + + serve.run(g.bind()) + deployment_info = ray.get(controller._all_running_replicas.remote()) + assert "g" in deployment_info + + @serve.deployment + def f(): + return "got f" + + serve.run(f.bind(), name="app1") + deployment_info = ray.get(controller._all_running_replicas.remote()) + assert "app1_f" in deployment_info + + if __name__ == "__main__": import sys diff --git a/python/ray/serve/tests/test_application_state.py b/python/ray/serve/tests/test_application_state.py new file mode 100644 index 000000000000..82b5a4e16038 --- /dev/null +++ b/python/ray/serve/tests/test_application_state.py @@ -0,0 +1,136 @@ +import sys +import pytest +from typing import List +import time + +import ray +from ray._private.test_utils import SignalActor +from ray.serve._private.application_state import ApplicationStateManager +from ray.serve._private.common import ApplicationStatus +from ray.serve._private.common import DeploymentStatus, DeploymentStatusInfo + + +class MockDeploymentStateManager: + def __init__(self): + self.deployment_statuses = [ + DeploymentStatusInfo("d1", DeploymentStatus.UPDATING), + DeploymentStatusInfo("d2", DeploymentStatus.UPDATING), + ] + + def set_deployment_statuses_unhealthy(self, index: int = 0): + self.deployment_statuses[index].status = DeploymentStatus.UNHEALTHY + + def set_deployment_statuses_healthy(self, index: int = 0): + self.deployment_statuses[index].status = DeploymentStatus.HEALTHY + + def get_deployment_statuses(self, deployment_names: List[str]): + return self.deployment_statuses + + def get_all_deployments(self): + return ["d1", "d2"] + + +def test_deploy_app(): + """Test DEPLOYING status""" + app_state_manager = ApplicationStateManager(MockDeploymentStateManager()) + app_state_manager.deploy_application("test_app", {}) + + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOYING + assert app_status.deployment_timestamp > 0 + + +def test_delete_app(): + """Test DELETING status""" + app_state_manager = ApplicationStateManager(MockDeploymentStateManager()) + app_state_manager.deploy_application("test_app", {}) + app_state_manager.delete_application("test_app") + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DELETING + + +def test_create_app(): + """Test object ref based deploy and set DEPLOYING""" + app_state_manager = ApplicationStateManager(MockDeploymentStateManager()) + app_state_manager.create_application_state("test_app", ray.ObjectRef.nil()) + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOYING + + +def test_update_app_running(): + """Test DEPLOYING -> RUNNING""" + app_state_manager = ApplicationStateManager(MockDeploymentStateManager()) + app_state_manager.deploy_application("test_app", {}) + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOYING + app_state_manager.deployment_state_manager.set_deployment_statuses_healthy(0) + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == 
ApplicationStatus.DEPLOYING + app_state_manager.deployment_state_manager.set_deployment_statuses_healthy(1) + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.RUNNING + + # rerun update, application status should not make difference + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.RUNNING + + +def test_update_app_deploy_failed(): + """Test DEPLOYING -> DEPLOY_FAILED""" + app_state_manager = ApplicationStateManager(MockDeploymentStateManager()) + app_state_manager.deploy_application("test_app", {}) + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOYING + app_state_manager.deployment_state_manager.set_deployment_statuses_unhealthy(0) + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOY_FAILED + # rerun update, application status should not make difference + app_state_manager.update() + assert app_status.status == ApplicationStatus.DEPLOY_FAILED + + +@pytest.mark.skipif(sys.platform == "win32", reason="Failing on Windows.") +@pytest.mark.parametrize("fail_deploy", [False, True]) +def test_config_deploy_app(fail_deploy): + """Test config based deploy + DEPLOYING -> RUNNING + DEPLOYING -> DEPLOY_FAILED + """ + signal = SignalActor.remote() + + @ray.remote + def task(): + ray.get(signal.wait.remote()) + if fail_deploy: + raise Exception("fail!") + + object_ref = task.remote() + app_state_manager = ApplicationStateManager(MockDeploymentStateManager()) + app_state_manager.create_application_state("test_app", object_ref) + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOYING + + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOYING + + signal.send.remote() + time.sleep(2) + if fail_deploy: + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.DEPLOY_FAILED + else: + app_state_manager.deployment_state_manager.set_deployment_statuses_healthy(0) + app_state_manager.deployment_state_manager.set_deployment_statuses_healthy(1) + app_state_manager.update() + app_status = app_state_manager.get_app_status("test_app") + assert app_status.status == ApplicationStatus.RUNNING + + +if __name__ == "__main__": + sys.exit(pytest.main(["-v", "-s", __file__])) diff --git a/python/ray/serve/tests/test_schema.py b/python/ray/serve/tests/test_schema.py index 0e289b0eabc2..c0e94936db72 100644 --- a/python/ray/serve/tests/test_schema.py +++ b/python/ray/serve/tests/test_schema.py @@ -664,22 +664,23 @@ def f1(): def f2(): pass - f1._func_or_class = "ray.serve.tests.test_schema.global_f" - f2._func_or_class = "ray.serve.tests.test_schema.global_f" - client = serve.start() - - f1.deploy() - f2.deploy() + serve.run(f1.bind(), name="app1") + serve.run(f2.bind(), name="app2") # Check statuses - statuses = serve_status_to_schema(client.get_serve_status()).deployment_statuses - deployment_names = {"f1", "f2"} - for deployment_status in statuses: - assert deployment_status.status in {"UPDATING", "HEALTHY"} - assert deployment_status.name in deployment_names - deployment_names.remove(deployment_status.name) - assert len(deployment_names) == 0 + f1_statuses = 
serve_status_to_schema( + client.get_serve_status("app1") + ).deployment_statuses + f2_statuses = serve_status_to_schema( + client.get_serve_status("app2") + ).deployment_statuses + assert len(f1_statuses) == 1 + assert f1_statuses[0].status in {"UPDATING", "HEALTHY"} + assert f1_statuses[0].name == "app1_f1" + assert len(f2_statuses) == 1 + assert f2_statuses[0].status in {"UPDATING", "HEALTHY"} + assert f2_statuses[0].name == "app2_f2" serve.shutdown() diff --git a/src/ray/protobuf/serve.proto b/src/ray/protobuf/serve.proto index f75beaa9ecdc..d328a7f4d8fe 100644 --- a/src/ray/protobuf/serve.proto +++ b/src/ray/protobuf/serve.proto @@ -203,6 +203,8 @@ enum ApplicationStatus { DEPLOYING = 0; RUNNING = 1; DEPLOY_FAILED = 2; + DELETING = 3; + NOT_STARTED = 5; } message ApplicationStatusInfo { @@ -214,6 +216,7 @@ message ApplicationStatusInfo { message StatusOverview { ApplicationStatusInfo app_status = 1; DeploymentStatusInfoList deployment_statuses = 2; + string name = 3; } // RPC Schema From 0cb80704509fd789c6da13ad70dfaa5d218fbd7d Mon Sep 17 00:00:00 2001 From: Sven Mika Date: Thu, 26 Jan 2023 17:54:42 +0100 Subject: [PATCH 005/267] [RLlib] AlgorithmConfig objects supported by all (internally used) `Algorithm.default_resource_request()` methods. (#31958) --- rllib/algorithms/algorithm.py | 9 ---- rllib/algorithms/alpha_star/alpha_star.py | 42 +++++++++------- rllib/algorithms/apex_dqn/apex_dqn.py | 48 +++++++++---------- rllib/algorithms/impala/impala.py | 44 ++++++++--------- rllib/algorithms/mock.py | 2 +- ...e_envs_with_inference_done_on_main_node.py | 21 +++++--- 6 files changed, 86 insertions(+), 80 deletions(-) diff --git a/rllib/algorithms/algorithm.py b/rllib/algorithms/algorithm.py index 81859387d005..61b75e8e4fbf 100644 --- a/rllib/algorithms/algorithm.py +++ b/rllib/algorithms/algorithm.py @@ -2725,15 +2725,6 @@ def _run_one_evaluation( Returns: The results dict from the evaluation call. """ - - eval_results = { - "evaluation": { - "episode_reward_max": np.nan, - "episode_reward_min": np.nan, - "episode_reward_mean": np.nan, - } - } - eval_func_to_use = ( self._evaluate_async if self.config.enable_async_evaluation diff --git a/rllib/algorithms/alpha_star/alpha_star.py b/rllib/algorithms/alpha_star/alpha_star.py index a388895b31cf..e829bde1900a 100644 --- a/rllib/algorithms/alpha_star/alpha_star.py +++ b/rllib/algorithms/alpha_star/alpha_star.py @@ -2,7 +2,7 @@ A multi-agent, distributed multi-GPU, league-capable asynch. PPO ================================================================ """ -from typing import Any, Dict, Optional, Type +from typing import Any, Dict, Optional, Type, Union import gymnasium as gym import tree @@ -257,25 +257,31 @@ class AlphaStar(appo.APPO): @classmethod @override(Algorithm) - def default_resource_request(cls, config): - cf = dict(cls.get_default_config(), **config) + def default_resource_request( + cls, + config: Union[AlgorithmConfig, PartialAlgorithmConfigDict], + ): + if isinstance(config, AlgorithmConfig): + cf: AlphaStarConfig = config + else: + cf: AlphaStarConfig = cls.get_default_config().update_from_dict(config) # Construct a dummy LeagueBuilder, such that it gets the opportunity to # adjust the multiagent config, according to its setup, and we can then # properly infer the resources to allocate. 
- from_config(cf["league_builder_config"], algo=None, algo_config=cf) + from_config(cf.league_builder_config, algo=None, algo_config=cf) - max_num_policies_to_train = cf["max_num_policies_to_train"] or len( - cf["multiagent"].get("policies_to_train") or cf["multiagent"]["policies"] + max_num_policies_to_train = cf.max_num_policies_to_train or len( + cf.policies_to_train or cf.policies ) num_learner_shards = min( - cf["num_gpus"] or max_num_policies_to_train, max_num_policies_to_train + cf.num_gpus or max_num_policies_to_train, max_num_policies_to_train ) - num_gpus_per_shard = cf["num_gpus"] / num_learner_shards + num_gpus_per_shard = cf.num_gpus / num_learner_shards num_policies_per_shard = max_num_policies_to_train / num_learner_shards - fake_gpus = cf["_fake_gpus"] + fake_gpus = cf._fake_gpus - eval_config = cf["evaluation_config"] + eval_config = cf.get_evaluation_config_object() # Return PlacementGroupFactory containing all needed resources # (already properly defined as device bundles). @@ -283,15 +289,15 @@ def default_resource_request(cls, config): bundles=[ { # Driver (no GPUs). - "CPU": cf["num_cpus_for_driver"], + "CPU": cf.num_cpus_for_local_worker, } ] + [ { # RolloutWorkers (no GPUs). - "CPU": cf["num_cpus_per_worker"], + "CPU": cf.num_cpus_per_worker, } - for _ in range(cf["num_workers"]) + for _ in range(cf.num_workers) ] + [ { @@ -310,20 +316,20 @@ def default_resource_request(cls, config): # Note: The local eval worker is located on the driver # CPU or not even created iff >0 eval workers. "CPU": eval_config.get( - "num_cpus_per_worker", cf["num_cpus_per_worker"] + "num_cpus_per_worker", cf.num_cpus_per_worker ), } - for _ in range(cf["evaluation_num_workers"]) + for _ in range(cf.evaluation_num_workers) ] - if cf["evaluation_interval"] + if cf.evaluation_interval else [] ), - strategy=config.get("placement_strategy", "PACK"), + strategy=cf.placement_strategy, ) @classmethod @override(appo.APPO) - def get_default_config(cls) -> AlgorithmConfig: + def get_default_config(cls) -> AlphaStarConfig: return AlphaStarConfig() @override(appo.APPO) diff --git a/rllib/algorithms/apex_dqn/apex_dqn.py b/rllib/algorithms/apex_dqn/apex_dqn.py index 4d46c0690039..5eea96eccc8e 100644 --- a/rllib/algorithms/apex_dqn/apex_dqn.py +++ b/rllib/algorithms/apex_dqn/apex_dqn.py @@ -15,7 +15,7 @@ import platform import random from collections import defaultdict -from typing import Any, Dict, List, Optional, Tuple +from typing import Any, Dict, List, Optional, Tuple, Union import ray from ray._private.dict import merge_dicts @@ -42,6 +42,7 @@ TARGET_NET_UPDATE_TIMER, ) from ray.rllib.utils.typing import ( + PartialAlgorithmConfigDict, ResultDict, SampleBatchType, ) @@ -700,10 +701,16 @@ def _compile_iteration_results(self, *args, **kwargs): @classmethod @override(Algorithm) - def default_resource_request(cls, config): - cf = dict(cls.get_default_config(), **config) + def default_resource_request( + cls, + config: Union[AlgorithmConfig, PartialAlgorithmConfigDict], + ): + if isinstance(config, AlgorithmConfig): + cf: ApexDQNConfig = config + else: + cf: ApexDQNConfig = cls.get_default_config().update_from_dict(config) - eval_config = cf["evaluation_config"] + eval_config = cf.get_evaluation_config_object() # Return PlacementGroupFactory containing all needed resources # (already properly defined as device bundles). @@ -715,19 +722,19 @@ def default_resource_request(cls, config): # data bandwidth between buffers and the learner (driver). 
# Replay buffer actors each contain one shard of the total # replay buffer and use 1 CPU each. - "CPU": cf["num_cpus_for_driver"] - + cf["optimizer"]["num_replay_buffer_shards"], - "GPU": 0 if cf["_fake_gpus"] else cf["num_gpus"], + "CPU": cf.num_cpus_for_local_worker + + cf.optimizer["num_replay_buffer_shards"], + "GPU": 0 if cf._fake_gpus else cf.num_gpus, } ] + [ { # RolloutWorkers. - "CPU": cf["num_cpus_per_worker"], - "GPU": cf["num_gpus_per_worker"], - **cf["custom_resources_per_worker"], + "CPU": cf.num_cpus_per_worker, + "GPU": cf.num_gpus_per_worker, + **cf.custom_resources_per_worker, } - for _ in range(cf["num_workers"]) + for _ in range(cf.num_rollout_workers) ] + ( [ @@ -735,23 +742,16 @@ def default_resource_request(cls, config): # Evaluation workers. # Note: The local eval worker is located on the driver # CPU. - "CPU": eval_config.get( - "num_cpus_per_worker", cf["num_cpus_per_worker"] - ), - "GPU": eval_config.get( - "num_gpus_per_worker", cf["num_gpus_per_worker"] - ), - **eval_config.get( - "custom_resources_per_worker", - cf["custom_resources_per_worker"], - ), + "CPU": eval_config.num_cpus_per_worker, + "GPU": eval_config.num_gpus_per_worker, + **eval_config.custom_resources_per_worker, } - for _ in range(cf["evaluation_num_workers"]) + for _ in range(cf.evaluation_num_workers) ] - if cf["evaluation_interval"] + if cf.evaluation_interval else [] ), - strategy=config.get("placement_strategy", "PACK"), + strategy=cf.placement_strategy, ) diff --git a/rllib/algorithms/impala/impala.py b/rllib/algorithms/impala/impala.py index 301589e095b7..bea342df72c2 100644 --- a/rllib/algorithms/impala/impala.py +++ b/rllib/algorithms/impala/impala.py @@ -42,6 +42,7 @@ from ray.rllib.utils.metrics.learner_info import LearnerInfoBuilder from ray.rllib.utils.typing import ( + PartialAlgorithmConfigDict, PolicyID, ResultDict, SampleBatchType, @@ -593,10 +594,16 @@ def training_step(self) -> ResultDict: @classmethod @override(Algorithm) - def default_resource_request(cls, config): - cf = dict(cls.get_default_config(), **config) + def default_resource_request( + cls, + config: Union[AlgorithmConfig, PartialAlgorithmConfigDict], + ): + if isinstance(config, AlgorithmConfig): + cf: ImpalaConfig = config + else: + cf: ImpalaConfig = cls.get_default_config().update_from_dict(config) - eval_config = cf["evaluation_config"] + eval_config = cf.get_evaluation_config_object() # Return PlacementGroupFactory containing all needed resources # (already properly defined as device bundles). @@ -610,18 +617,18 @@ def default_resource_request(cls, config): # from RolloutWorkers (n rollout workers map to m # aggregation workers, where m < n) and always use 1 CPU # each. - "CPU": cf["num_cpus_for_driver"] + cf["num_aggregation_workers"], - "GPU": 0 if cf["_fake_gpus"] else cf["num_gpus"], + "CPU": cf.num_cpus_for_local_worker + cf.num_aggregation_workers, + "GPU": 0 if cf._fake_gpus else cf.num_gpus, } ] + [ { # RolloutWorkers. - "CPU": cf["num_cpus_per_worker"], - "GPU": cf["num_gpus_per_worker"], - **cf["custom_resources_per_worker"], + "CPU": cf.num_cpus_per_worker, + "GPU": cf.num_gpus_per_worker, + **cf.custom_resources_per_worker, } - for _ in range(cf["num_workers"]) + for _ in range(cf.num_rollout_workers) ] + ( [ @@ -629,23 +636,16 @@ def default_resource_request(cls, config): # Evaluation (remote) workers. # Note: The local eval worker is located on the driver # CPU or not even created iff >0 eval workers. 
- "CPU": eval_config.get( - "num_cpus_per_worker", cf["num_cpus_per_worker"] - ), - "GPU": eval_config.get( - "num_gpus_per_worker", cf["num_gpus_per_worker"] - ), - **eval_config.get( - "custom_resources_per_worker", - cf["custom_resources_per_worker"], - ), + "CPU": eval_config.num_cpus_per_worker, + "GPU": eval_config.num_gpus_per_worker, + **eval_config.custom_resources_per_worker, } - for _ in range(cf["evaluation_num_workers"]) + for _ in range(cf.evaluation_num_workers) ] - if cf["evaluation_interval"] + if cf.evaluation_interval else [] ), - strategy=config.get("placement_strategy", "PACK"), + strategy=cf.placement_strategy, ) def concatenate_batches_and_pre_queue(self, batches: List[SampleBatch]): diff --git a/rllib/algorithms/mock.py b/rllib/algorithms/mock.py index b00b72a7c546..f89955812b1e 100644 --- a/rllib/algorithms/mock.py +++ b/rllib/algorithms/mock.py @@ -27,7 +27,7 @@ def get_default_config(cls) -> AlgorithmConfig: ) @classmethod - def default_resource_request(cls, config): + def default_resource_request(cls, config: AlgorithmConfig): return None @override(Algorithm) diff --git a/rllib/examples/remote_envs_with_inference_done_on_main_node.py b/rllib/examples/remote_envs_with_inference_done_on_main_node.py index ed9957f98cfe..bbefcc0439e1 100644 --- a/rllib/examples/remote_envs_with_inference_done_on_main_node.py +++ b/rllib/examples/remote_envs_with_inference_done_on_main_node.py @@ -11,13 +11,16 @@ """ import argparse import os +from typing import Union import ray +from ray import air, tune from ray.rllib.algorithms.ppo import PPO, PPOConfig from ray.rllib.algorithms.algorithm import Algorithm +from ray.rllib.algorithms.algorithm_config import AlgorithmConfig from ray.rllib.utils.annotations import override from ray.rllib.utils.test_utils import check_learning_achieved -from ray import air, tune +from ray.rllib.utils.typing import PartialAlgorithmConfigDict from ray.tune import PlacementGroupFactory from ray.tune.logger import pretty_print @@ -82,8 +85,14 @@ def get_cli_args(): class PPORemoteInference(PPO): @classmethod @override(Algorithm) - def default_resource_request(cls, config): - cf = dict(cls.get_default_config(), **config) + def default_resource_request( + cls, + config: Union[AlgorithmConfig, PartialAlgorithmConfigDict], + ): + if isinstance(config, AlgorithmConfig): + cf = config + else: + cf = cls.get_default_config().update_from_dict(config) # Return PlacementGroupFactory containing all needed resources # (already properly defined as device bundles). @@ -94,15 +103,15 @@ def default_resource_request(cls, config): # main model in this example (num_workers=0). "CPU": 1, # Possibly add n GPUs to this. - "GPU": cf["num_gpus"], + "GPU": cf.num_gpus, }, { # Different bundle (meaning: possibly different node) # for your n "remote" envs (set remote_worker_envs=True). 
- "CPU": cf["num_envs_per_worker"], + "CPU": cf.num_envs_per_worker, }, ], - strategy=config.get("placement_strategy", "PACK"), + strategy=cf.placement_strategy, ) From e72a389c82a2f535072f3510c30312bf1b87e599 Mon Sep 17 00:00:00 2001 From: Amog Kamsetty Date: Thu, 26 Jan 2023 10:03:22 -0800 Subject: [PATCH 006/267] [Data] Add Logical Operator for `filter` and `flat_map` (#31954) Signed-off-by: amogkam amogkamsetty@yahoo.com Adds logical operators for filter() and flat_map() Closes #31936 --- .../logical/operators/map_operator.py | 62 ++++++++++++++++ python/ray/data/dataset.py | 29 +++++++- .../data/tests/test_execution_optimizer.py | 70 ++++++++++++++++--- 3 files changed, 151 insertions(+), 10 deletions(-) diff --git a/python/ray/data/_internal/logical/operators/map_operator.py b/python/ray/data/_internal/logical/operators/map_operator.py index 5ecddcd9d32a..261e198cc3b6 100644 --- a/python/ray/data/_internal/logical/operators/map_operator.py +++ b/python/ray/data/_internal/logical/operators/map_operator.py @@ -26,8 +26,28 @@ class AbstractMap(LogicalOperator): """Abstract class for logical operators should be converted to physical MapOperator. + + Args: + name: Name for this operator. This is the name that will appear when inspecting + the logical plan of a Dataset. + input_op: The operator preceding this operator in the plan DAG. The outputs of + `input_op` will be the inputs to this operator. + block_fn: The transform function to apply to each input block to produce output + blocks. + target_block_size: The target size for blocks outputted by this operator. + fn: User provided UDF to be called in `block_fn`. + fn_args: Arguments to `fn`. + fn_kwargs: Keyword arguments to `fn`. + fn_constructor_args: Arguments to provide to the initializor of `fn` if `fn` is + a callable class. + fn_constructor_kwargs: Keyword Arguments to provide to the initializor of `fn` + if `fn` is a callable class. + ray_remote_args: Args to provide to ray.remote. """ + # TODO: Replace `fn`, `fn_args`, `fn_kwargs`, `fn_constructor_args`, and + # `fn_constructor_kwargs` from this API, in favor of `block_fn_args` and + # `block_fn_kwargs`. Operators should only be concerned with `block_fn`. 
def __init__( self, name: str, @@ -112,6 +132,48 @@ def __init__( ) +class Filter(AbstractMap): + """Logical operator for filter.""" + + def __init__( + self, + input_op: LogicalOperator, + block_fn: BlockTransform, + fn: RowUDF, + compute: Optional[Union[str, ComputeStrategy]] = None, + ray_remote_args: Optional[Dict[str, Any]] = None, + ): + super().__init__( + "Filter", + input_op, + block_fn, + compute=compute, + fn=fn, + ray_remote_args=ray_remote_args, + ) + + +class FlatMap(AbstractMap): + """Logical operator for flat_map.""" + + def __init__( + self, + input_op: LogicalOperator, + block_fn: BlockTransform, + fn: RowUDF, + compute: Optional[Union[str, ComputeStrategy]] = None, + ray_remote_args: Optional[Dict[str, Any]] = None, + ): + super().__init__( + "FlatMap", + input_op, + block_fn, + compute=compute, + fn=fn, + ray_remote_args=ray_remote_args, + ) + + def plan_map_op(op: AbstractMap, input_physical_dag: PhysicalOperator) -> MapOperator: """Get the corresponding physical operators DAG for AbstractMap operators.""" compute = get_compute(op._compute) diff --git a/python/ray/data/dataset.py b/python/ray/data/dataset.py index d2f146bf10aa..7ab51669992b 100644 --- a/python/ray/data/dataset.py +++ b/python/ray/data/dataset.py @@ -32,6 +32,8 @@ from ray.air.util.data_batch_conversion import BlockFormat from ray.data._internal.logical.optimizers import LogicalPlan from ray.data._internal.logical.operators.map_operator import ( + Filter, + FlatMap, MapRows, MapBatches, ) @@ -902,7 +904,18 @@ def transform(block: Block, fn: RowUDF[T, U]) -> Iterable[Block]: plan = self._plan.with_stage( OneToOneStage("flat_map", transform, compute, ray_remote_args, fn=fn) ) - return Dataset(plan, self._epoch, self._lazy) + + logical_plan = self._logical_plan + if logical_plan is not None: + op = FlatMap( + input_op=logical_plan.dag, + block_fn=transform, + fn=fn, + compute=compute, + ray_remote_args=ray_remote_args, + ) + logical_plan = LogicalPlan(op) + return Dataset(plan, self._epoch, self._lazy, logical_plan) def filter( self, @@ -967,7 +980,19 @@ def transform(block: Block, fn: RowUDF[T, U]) -> Iterable[Block]: plan = self._plan.with_stage( OneToOneStage("filter", transform, compute, ray_remote_args, fn=fn) ) - return Dataset(plan, self._epoch, self._lazy) + + logical_plan = self._logical_plan + if logical_plan is not None: + op = Filter( + input_op=logical_plan.dag, + block_fn=transform, + fn=fn, + compute=compute, + ray_remote_args=ray_remote_args, + ) + logical_plan = LogicalPlan(op) + + return Dataset(plan, self._epoch, self._lazy, logical_plan) def repartition(self, num_blocks: int, *, shuffle: bool = False) -> "Dataset[T]": """Repartition the dataset into exactly this number of blocks. 
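A minimal sketch of how the two new logical operators compose end to end, assuming the same optimizer-enabled context as the tests that follow (the chained example itself is illustrative and not taken from the patch):

import ray

# Each eager call appends a logical operator to the Dataset's LogicalPlan
# (Filter, then FlatMap); with the optimizer enabled, the planner lowers
# each of them to a physical MapOperator, as the tests below verify.
ds = ray.data.range(5)
ds = ds.filter(lambda x: x % 2 == 0)    # Filter logical operator
ds = ds.flat_map(lambda x: [x, x])      # FlatMap logical operator
assert ds.take_all() == [0, 0, 2, 2, 4, 4]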
diff --git a/python/ray/data/tests/test_execution_optimizer.py b/python/ray/data/tests/test_execution_optimizer.py index 34596fc82ca4..8901826ee616 100644 --- a/python/ray/data/tests/test_execution_optimizer.py +++ b/python/ray/data/tests/test_execution_optimizer.py @@ -4,20 +4,18 @@ from ray.data._internal.execution.operators.map_operator import MapOperator from ray.data._internal.execution.operators.input_data_buffer import InputDataBuffer from ray.data._internal.logical.operators.read_operator import Read -from ray.data._internal.logical.operators.map_operator import MapRows, MapBatches +from ray.data._internal.logical.operators.map_operator import ( + MapRows, + MapBatches, + Filter, + FlatMap, +) from ray.data._internal.logical.planner import Planner from ray.data.datasource.parquet_datasource import ParquetDatasource from ray.tests.conftest import * # noqa -def test_e2e_optimizer_sanity(ray_start_cluster_enabled, enable_optimizer): - ds = ray.data.range(5) - ds = ds.map_batches(lambda x: x) - ds = ds.map(lambda x: x + 1) - assert ds.take_all() == [1, 2, 3, 4, 5], ds - - def test_read_operator(ray_start_cluster_enabled, enable_optimizer): planner = Planner() op = Read(ParquetDatasource()) @@ -45,6 +43,12 @@ def test_map_batches_operator(ray_start_cluster_enabled, enable_optimizer): assert isinstance(physical_op.input_dependencies[0], MapOperator) +def test_map_batches_e2e(ray_start_cluster_enabled, enable_optimizer): + ds = ray.data.range(5) + ds = ds.map_batches(lambda x: x) + assert ds.take_all() == list(range(5)), ds + + def test_map_rows_operator(ray_start_cluster_enabled, enable_optimizer): planner = Planner() read_op = Read(ParquetDatasource()) @@ -61,6 +65,56 @@ def test_map_rows_operator(ray_start_cluster_enabled, enable_optimizer): assert isinstance(physical_op.input_dependencies[0], MapOperator) +def test_map_rows_e2e(ray_start_cluster_enabled, enable_optimizer): + ds = ray.data.range(5) + ds = ds.map(lambda x: x + 1) + assert ds.take_all() == [1, 2, 3, 4, 5], ds + + +def test_filter_operator(ray_start_cluster_enabled, enable_optimizer): + planner = Planner() + read_op = Read(ParquetDatasource()) + op = Filter( + read_op, + lambda it: (x for x in it), + lambda x: x, + ) + physical_op = planner.plan(op) + + assert op.name == "Filter" + assert isinstance(physical_op, MapOperator) + assert len(physical_op.input_dependencies) == 1 + assert isinstance(physical_op.input_dependencies[0], MapOperator) + + +def test_filter_e2e(ray_start_cluster_enabled, enable_optimizer): + ds = ray.data.range(5) + ds = ds.filter(fn=lambda x: x % 2 == 0) + assert ds.take_all() == [0, 2, 4], ds + + +def test_flat_map(ray_start_cluster_enabled, enable_optimizer): + planner = Planner() + read_op = Read(ParquetDatasource()) + op = FlatMap( + read_op, + lambda it: ([x, x] for x in it), + lambda x: x, + ) + physical_op = planner.plan(op) + + assert op.name == "FlatMap" + assert isinstance(physical_op, MapOperator) + assert len(physical_op.input_dependencies) == 1 + assert isinstance(physical_op.input_dependencies[0], MapOperator) + + +def test_flat_map_e2e(ray_start_cluster_enabled, enable_optimizer): + ds = ray.data.range(2) + ds = ds.flat_map(fn=lambda x: [x, x]) + assert ds.take_all() == [0, 0, 1, 1], ds + + if __name__ == "__main__": import sys From 994c3d63440665c664766f64e0eb48a60a4cf4e4 Mon Sep 17 00:00:00 2001 From: Kai Fricke Date: Thu, 26 Jan 2023 11:18:57 -0800 Subject: [PATCH 007/267] [docker/arm64] Build docker images (with suffix) for arm64 (#31861) This PR adds Docker image builds for arm64 
(aarch64). The images will be tagged with a suffix `-aarch64`. In a future retagging step, we can combine the existing x86_64 images with the aarch64 images for true multiplatform images. Changes needed to make this work: - Move libgcc to libgcc-ng because the former does not exist on conda for aarch64 - Upgrade Python 3.7.7 to 3.7.16 because the former does not exist on conda for aarch74 Please also note that aarch64 base images only exist for CUDA >= 11.2. Lastly, we are not building ray-ml docker images. This is because not all current dependencies are compatible with aarch64 - specifically, tensorflow requires at least 1.10.1 and torch 1.13.0 does not seem to be released for linux aarch64. Signed-off-by: Kai Fricke --- .buildkite/pipeline.arm64.yml | 80 +++++++++++ build-docker.sh | 2 +- ci/build/build-docker-images.py | 181 +++++++++++++++++++------ docker/base-deps/Dockerfile | 8 +- docker/base-deps/README.md | 14 +- docker/ray-deps/README.md | 13 +- docker/ray-ml/README.md | 2 + docker/ray-worker-container/Dockerfile | 6 +- docker/ray/README.md | 28 +++- 9 files changed, 283 insertions(+), 51 deletions(-) diff --git a/.buildkite/pipeline.arm64.yml b/.buildkite/pipeline.arm64.yml index 99388bf18671..e49fff07fb41 100644 --- a/.buildkite/pipeline.arm64.yml +++ b/.buildkite/pipeline.arm64.yml @@ -54,3 +54,83 @@ # - python .buildkite/copy_files.py --destination branch_wheels --path ./.whl # # Upload to latest directory. # - if [ "$BUILDKITE_BRANCH" == "master" ]; then python .buildkite/copy_files.py --destination wheels --path ./.whl; fi + + +- label: ":mechanical_arm: :docker: Build Images: py37 [aarch64] (1/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py37 --device-types cpu cu112 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py37 [aarch64] (2/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py37 --device-types cu113 cu116 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py38 [aarch64] (1/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py38 --device-types cpu cu112 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py38 [aarch64] (2/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination 
docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py38 --device-types cu113 cu116 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py39 [aarch64] (1/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py39 --device-types cpu cu112 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py39 [aarch64] (2/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py39 --device-types cu113 cu116 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py310 [aarch64] (1/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - ./ci/env/env_info.sh + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py310 --device-types cpu cu112 --build-type BUILDKITE --build-base --suffix aarch64 + +- label: ":mechanical_arm: :docker: Build Images: py310 [aarch64] (2/2)" + conditions: ["RAY_CI_LINUX_WHEELS_AFFECTED"] + instance_size: arm64-medium + commands: + - LINUX_WHEELS=1 ./ci/ci.sh build + - pip install -q docker aws_requests_auth boto3 + - if [ "${BUILDKITE_PULL_REQUEST}" = "false" ]; then python .buildkite/copy_files.py --destination docker_login; fi + - python ./ci/build/build-docker-images.py --py-versions py310 --device-types cu113 cu116 --build-type BUILDKITE --build-base --suffix aarch64 diff --git a/build-docker.sh b/build-docker.sh index 0b640c040637..8d8f5fbe250e 100755 --- a/build-docker.sh +++ b/build-docker.sh @@ -8,7 +8,7 @@ set -x GPU="" BASE_IMAGE="ubuntu:focal" WHEEL_URL="https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-3.0.0.dev0-cp37-cp37m-manylinux2014_x86_64.whl" -PYTHON_VERSION="3.7.7" +PYTHON_VERSION="3.7.16" while [[ $# -gt 0 ]] diff --git a/ci/build/build-docker-images.py b/ci/build/build-docker-images.py index fd8745af00e1..e3a3fec464c6 100644 --- a/ci/build/build-docker-images.py +++ b/ci/build/build-docker-images.py @@ -5,12 +5,13 @@ import glob import itertools import os +import platform import re import shutil import subprocess import sys from collections import defaultdict -from typing import List, Tuple +from typing import List, Optional, Tuple import docker @@ -18,6 +19,7 @@ DOCKER_USERNAME = "raytravisbot" DOCKER_CLIENT = None PYTHON_WHL_VERSION = "cp3" +ADDITIONAL_PLATFORMS = ["aarch64"] DOCKER_HUB_DESCRIPTION = { "base-deps": ( @@ -70,6 +72,12 @@ IMAGE_NAMES = list(DOCKER_HUB_DESCRIPTION.keys()) +def _with_suffix(tag: str, suffix: Optional[str] = None): + if suffix: + return tag + "-" + suffix + return tag + + def _get_branch(): branch = os.environ.get("TRAVIS_BRANCH") or 
os.environ.get("BUILDKITE_BRANCH") if not branch: @@ -159,7 +167,11 @@ def _check_if_docker_files_modified(): def _build_docker_image( - image_name: str, py_version: str, image_type: str, no_cache=True + image_name: str, + py_version: str, + image_type: str, + suffix: Optional[str] = None, + no_cache=True, ): """Builds Docker image with the provided info. @@ -169,6 +181,7 @@ def _build_docker_image( Must be one of PY_MATRIX.keys() image_type: The image type to build. Must be one of BASE_IMAGES.keys() + suffix: Suffix to add to the tags (e.g. "aarch64" for "ray:sha256-aarch64") no_cache: If True, don't use caching when building the image. """ @@ -197,6 +210,9 @@ def _build_docker_image( # I.e. "py310"[3:] == 10 build_args["PYTHON_MINOR_VERSION"] = py_version[3:] + if platform.processor() in ADDITIONAL_PLATFORMS: + build_args["HOSTTYPE"] = platform.processor() + device_tag = f"{image_type}" if image_name == "base-deps": @@ -204,6 +220,8 @@ def _build_docker_image( else: base_image = f"-{py_version}-{device_tag}" + base_image = _with_suffix(base_image, suffix=suffix) + if image_name != "ray-worker-container": build_args["BASE_IMAGE"] = base_image @@ -216,6 +234,8 @@ def _build_docker_image( tagged_name = f"rayproject/{image_name}:nightly-{py_version}-{device_tag}" + tagged_name = _with_suffix(tagged_name, suffix=suffix) + for i in range(2): cleanup = DOCKER_CLIENT.containers.prune().get("SpaceReclaimed") if cleanup is not None: @@ -305,22 +325,33 @@ def check_staleness(repository, tag): return is_stale -def build_for_all_versions(image_name, py_versions, image_types, **kwargs): +def build_for_all_versions(image_name, py_versions, image_types, suffix, **kwargs): """Builds the given Docker image for all Python & CUDA versions""" for py_version in py_versions: for image_type in image_types: _build_docker_image( - image_name, py_version=py_version, image_type=image_type, **kwargs + image_name, + py_version=py_version, + image_type=image_type, + suffix=suffix, + **kwargs, ) -def build_base_images(py_versions, image_types): - build_for_all_versions("base-deps", py_versions, image_types, no_cache=False) - build_for_all_versions("ray-deps", py_versions, image_types, no_cache=False) +def build_base_images(py_versions, image_types, suffix): + build_for_all_versions( + "base-deps", py_versions, image_types, suffix=suffix, no_cache=False + ) + build_for_all_versions( + "ray-deps", py_versions, image_types, suffix=suffix, no_cache=False + ) def build_or_pull_base_images( - py_versions: List[str], image_types: List[str], rebuild_base_images: bool = True + py_versions: List[str], + image_types: List[str], + rebuild_base_images: bool = True, + suffix: Optional[str] = None, ) -> bool: """Returns images to tag and build.""" repositories = ["rayproject/base-deps", "rayproject/ray-deps"] @@ -342,7 +373,7 @@ def build_or_pull_base_images( is_stale = True if rebuild_base_images or _release_build() or is_stale: - build_base_images(py_versions, image_types) + build_base_images(py_versions, image_types, suffix=suffix) return True else: print("Just pulling images!") @@ -441,8 +472,9 @@ def _create_new_tags(all_tags, old_str, new_str): def push_and_tag_images( py_versions: List[str], image_types: List[str], - push_base_images: bool, merge_build: bool = False, + image_list: Optional[List[str]] = None, + suffix: Optional[str] = None, ): date_tag = datetime.datetime.now().strftime("%Y-%m-%d") @@ -452,10 +484,6 @@ def push_and_tag_images( date_tag = release_name sha_tag = release_name - image_list = ["ray", "ray-ml"] - if 
push_base_images: - image_list.extend(["base-deps", "ray-deps"]) - for image_name in image_list: full_image_name = f"rayproject/{image_name}" @@ -476,7 +504,8 @@ def push_and_tag_images( ) continue - tag = f"nightly-{py_name}-{image_type}" + tag = _with_suffix(f"nightly-{py_name}-{image_type}", suffix=suffix) + tag_mapping[tag].append(tag) # If no device is specified, it should map to CPU image. @@ -519,41 +548,83 @@ def push_and_tag_images( ) tag_mapping[old_tag].extend(new_tags) + print(f"These tags will be created for {image_name}: ", tag_mapping) + # Sanity checking. for old_tag in tag_mapping.keys(): if DEFAULT_PYTHON_VERSION in old_tag: if "-cpu" in old_tag: - assert "nightly-cpu" in tag_mapping[old_tag] + assert ( + _with_suffix("nightly-cpu", suffix=suffix) + in tag_mapping[old_tag] + ) if "-deps" in image_name: - assert "nightly" in tag_mapping[old_tag] - assert f"{date_tag}-cpu" in tag_mapping[old_tag] - assert f"{date_tag}" in tag_mapping[old_tag] + assert ( + _with_suffix("nightly", suffix=suffix) + in tag_mapping[old_tag] + ) + assert ( + _with_suffix(f"{date_tag}-cpu", suffix=suffix) + in tag_mapping[old_tag] + ) + assert ( + _with_suffix(f"{date_tag}", suffix=suffix) + in tag_mapping[old_tag] + ) elif image_name == "ray": - assert "nightly" in tag_mapping[old_tag] - assert f"{sha_tag}-cpu" in tag_mapping[old_tag] - assert f"{sha_tag}" in tag_mapping[old_tag] + assert ( + _with_suffix("nightly", suffix=suffix) + in tag_mapping[old_tag] + ) + assert ( + _with_suffix(f"{sha_tag}-cpu", suffix=suffix) + in tag_mapping[old_tag] + ) + assert ( + _with_suffix(f"{sha_tag}", suffix=suffix) + in tag_mapping[old_tag] + ) # For ray-ml, nightly should refer to the GPU image. elif image_name == "ray-ml": - assert f"{sha_tag}-cpu" in tag_mapping[old_tag] + assert ( + _with_suffix(f"{sha_tag}-cpu", suffix=suffix) + in tag_mapping[old_tag] + ) else: raise RuntimeError(f"Invalid image name: {image_name}") elif ML_CUDA_VERSION in old_tag: - assert "nightly-gpu" in tag_mapping[old_tag] + assert ( + _with_suffix("nightly-gpu", suffix=suffix) + in tag_mapping[old_tag] + ) if "-deps" in image_name: - assert f"{date_tag}-gpu" in tag_mapping[old_tag] + assert ( + _with_suffix(f"{date_tag}-gpu", suffix=suffix) + in tag_mapping[old_tag] + ) elif image_name == "ray": - assert f"{sha_tag}-gpu" in tag_mapping[old_tag] + assert ( + _with_suffix(f"{sha_tag}-gpu", suffix=suffix) + in tag_mapping[old_tag] + ) # For ray-ml, nightly should refer to the GPU image. elif image_name == "ray-ml": - assert "nightly" in tag_mapping[old_tag] - assert f"{sha_tag}" in tag_mapping[old_tag] - assert f"{sha_tag}-gpu" in tag_mapping[old_tag] + assert ( + _with_suffix("nightly", suffix=suffix) + in tag_mapping[old_tag] + ) + assert ( + _with_suffix(f"{sha_tag}", suffix=suffix) + in tag_mapping[old_tag] + ) + assert ( + _with_suffix(f"{sha_tag}-gpu", suffix=suffix) + in tag_mapping[old_tag] + ) else: raise RuntimeError(f"Invalid image name: {image_name}") - print(f"These tags will be created for {image_name}: ", tag_mapping) - # Tag and push all images. 
for old_tag in tag_mapping.keys(): for new_tag in tag_mapping[old_tag]: @@ -636,6 +707,12 @@ def push_readmes(merge_build: bool): required=True, help="Whether to bypass checking if docker is affected", ) + parser.add_argument( + "--suffix", + required=False, + choices=ADDITIONAL_PLATFORMS, + help="Suffix to append to the build tags", + ) parser.add_argument( "--build-base", dest="base", @@ -718,28 +795,47 @@ def push_readmes(merge_build: bool): DOCKER_CLIENT.api.login(username=username, password=password) copy_wheels(build_type == HUMAN) is_base_images_built = build_or_pull_base_images( - py_versions, image_types, args.base + py_versions, image_types, args.base, suffix=args.suffix ) if args.only_build_worker_container: - build_for_all_versions("ray-worker-container", py_versions, image_types) + build_for_all_versions( + "ray-worker-container", py_versions, image_types, suffix=args.suffix + ) # TODO Currently don't push ray_worker_container else: # Build Ray Docker images. - build_for_all_versions("ray", py_versions, image_types) + build_for_all_versions("ray", py_versions, image_types, suffix=args.suffix) + + # List of images to tag and push to docker hub + images_to_tag_and_push = [] + + if is_base_images_built: + images_to_tag_and_push += ["base-deps", "ray-deps"] + + # Always tag/push ray + images_to_tag_and_push += ["ray"] # Only build ML Docker images for ML_CUDA_VERSION or cpu. - ml_image_types = [ - image_type - for image_type in image_types - if image_type in [ML_CUDA_VERSION, "cpu"] - ] + if platform.processor() not in ADDITIONAL_PLATFORMS: + ml_image_types = [ + image_type + for image_type in image_types + if image_type in [ML_CUDA_VERSION, "cpu"] + ] + else: + # Do not build ray-ml e.g. for arm64 + ml_image_types = [] if len(ml_image_types) > 0: prep_ray_ml() build_for_all_versions( - "ray-ml", py_versions, image_types=ml_image_types + "ray-ml", + py_versions, + image_types=ml_image_types, + suffix=args.suffix, ) + images_to_tag_and_push += ["ray-ml"] if build_type in {MERGE, PR}: valid_branch = _valid_branch() @@ -748,8 +844,9 @@ def push_readmes(merge_build: bool): push_and_tag_images( py_versions, image_types, - is_base_images_built, - valid_branch and is_merge, + merge_build=valid_branch and is_merge, + image_list=images_to_tag_and_push, + suffix=args.suffix, ) # TODO(ilr) Re-Enable Push READMEs by using a normal password diff --git a/docker/base-deps/Dockerfile b/docker/base-deps/Dockerfile index 6334c1359305..0b60772e8415 100644 --- a/docker/base-deps/Dockerfile +++ b/docker/base-deps/Dockerfile @@ -11,7 +11,9 @@ ENV TZ=America/Los_Angeles # TODO(ilr) $HOME seems to point to result in "" instead of "/home/ray" ENV PATH "/home/ray/anaconda3/bin:$PATH" ARG DEBIAN_FRONTEND=noninteractive -ARG PYTHON_VERSION=3.7.7 +ARG PYTHON_VERSION=3.7.16 + +ARG HOSTTYPE=${HOSTTYPE:-x86_64} ARG RAY_UID=1000 ARG RAY_GID=100 @@ -42,14 +44,14 @@ RUN sudo apt-get update -y && sudo apt-get upgrade -y \ openssh-client \ gnupg; fi) \ && wget \ - --quiet "https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh" \ + --quiet "https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-${HOSTTYPE}.sh" \ -O /tmp/miniconda.sh \ && /bin/bash /tmp/miniconda.sh -b -u -p $HOME/anaconda3 \ && $HOME/anaconda3/bin/conda init \ && echo 'export PATH=$HOME/anaconda3/bin:$PATH' >> /home/ray/.bashrc \ && rm /tmp/miniconda.sh \ && $HOME/anaconda3/bin/conda install -y \ - libgcc python=$PYTHON_VERSION \ + libgcc-ng python=$PYTHON_VERSION \ && $HOME/anaconda3/bin/conda clean -y --all \ && 
$HOME/anaconda3/bin/pip install --no-cache-dir \ flatbuffers \ diff --git a/docker/base-deps/README.md b/docker/base-deps/README.md index f7d92140a597..048020779b71 100644 --- a/docker/base-deps/README.md +++ b/docker/base-deps/README.md @@ -6,7 +6,7 @@ This image has the system-level dependencies for `Ray` and the `Ray Autoscaler` ## Tags -Images are `tagged` with the format `{Ray version}[-{Python version}][-{Platform}]`. `Ray version` tag can be one of the following: +Images are `tagged` with the format `{Ray version}[-{Python version}][-{Platform}][-{Architecture}]`. `Ray version` tag can be one of the following: | Ray version tag | Description | | --------------- | ----------- | @@ -26,6 +26,18 @@ The optional `Platform` tag specifies the platform where the image is intended f | `-gpu` | Aliases to a specific `-cuXX` tagged image. | | no tag | Aliases to `-cpu` tagged images for `ray`, and aliases to ``-gpu`` tagged images for `ray-ml`. | +The optional `Architecture` tag can be used to specify images for different CPU architectures. +Currently, we support the `x86_64` (`amd64`) and `aarch64` (`arm64`) architectures. + +Please note that suffixes are only used to specify `aarch64` images. No suffix means +`x86_64`/`amd64`-compatible images. + +| Platform tag | Description | +|--------------|-------------------------| +| `-aarch64` | arm64-compatible images | +| no tag | Defaults to `amd64` | + + ## Other Images * [`rayproject/ray`](https://hub.docker.com/repository/docker/rayproject/ray) - Ray and all of its dependencies. * [`rayproject/ray-ml`](https://hub.docker.com/repository/docker/rayproject/ray-ml) - This image with common ML libraries to make development & deployment more smooth! diff --git a/docker/ray-deps/README.md b/docker/ray-deps/README.md index 9be0ee4795e5..d510fdb16861 100644 --- a/docker/ray-deps/README.md +++ b/docker/ray-deps/README.md @@ -5,7 +5,7 @@ This has the python-level dependencies for `Ray` and the `Ray Autoscaler`. The ` ## Tags -Images are `tagged` with the format `{Ray version}[-{Python version}][-{Platform}]`. `Ray version` tag can be one of the following: +Images are `tagged` with the format `{Ray version}[-{Python version}][-{Platform}][-{Architecture}]`. `Ray version` tag can be one of the following: | Ray version tag | Description | | --------------- | ----------- | @@ -25,6 +25,17 @@ The optional `Platform` tag specifies the platform where the image is intended f | `-gpu` | Aliases to a specific `-cuXX` tagged image. | | no tag | Aliases to `-cpu` tagged images for `ray`, and aliases to ``-gpu`` tagged images for `ray-ml`. | +The optional `Architecture` tag can be used to specify images for different CPU architectures. +Currently, we support the `x86_64` (`amd64`) and `aarch64` (`arm64`) architectures. + +Please note that suffixes are only used to specify `aarch64` images. No suffix means +`x86_64`/`amd64`-compatible images. + +| Platform tag | Description | +|--------------|-------------------------| +| `-aarch64` | arm64-compatible images | +| no tag | Defaults to `amd64` | + ## Other Images * [`rayproject/ray`](https://hub.docker.com/repository/docker/rayproject/ray) - Ray and all of its dependencies. * [`rayproject/ray-ml`](https://hub.docker.com/repository/docker/rayproject/ray-ml) - This image with common ML libraries to make development & deployment more smooth! 
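The architecture suffix described in these READMEs is appended by the `_with_suffix` helper added to ci/build/build-docker-images.py above; a small sketch of the resulting tag naming (the standalone function below is illustrative and simply mirrors that helper):

from typing import Optional

def with_suffix(tag: str, suffix: Optional[str] = None) -> str:
    # x86_64/amd64 images keep their existing, suffix-free tags; aarch64
    # images get the architecture appended as a trailing "-aarch64".
    return tag + "-" + suffix if suffix else tag

assert with_suffix("nightly-py38-cu112") == "nightly-py38-cu112"
assert with_suffix("nightly-py38-cu112", "aarch64") == "nightly-py38-cu112-aarch64"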
diff --git a/docker/ray-ml/README.md b/docker/ray-ml/README.md index 56d32e9a029b..22a6cb13ee5f 100644 --- a/docker/ray-ml/README.md +++ b/docker/ray-ml/README.md @@ -29,5 +29,7 @@ Examples tags: - `nightly-py38-cpu` - `806c18-py38-cu112` +The `ray-ml` images are not built for the `arm64` (`aarch64`) architecture. + ## Other Images * [`rayproject/ray`](https://hub.docker.com/repository/docker/rayproject/ray) - Ray and all of its dependencies. diff --git a/docker/ray-worker-container/Dockerfile b/docker/ray-worker-container/Dockerfile index e340b6af0b62..fc6f2c6a404f 100644 --- a/docker/ray-worker-container/Dockerfile +++ b/docker/ray-worker-container/Dockerfile @@ -6,9 +6,11 @@ ARG BASE_IMAGE ARG AUTOSCALER="autoscaler" ENV TZ=America/Los_Angeles +ARG HOSTTYPE=${HOSTTYPE:-x86_64} + ENV PATH "/root/anaconda3/bin:$PATH" ARG DEBIAN_FRONTEND=noninteractive -ARG PYTHON_VERSION=3.7.7 +ARG PYTHON_VERSION=3.7.16 RUN apt-get update -y \ && apt-get install -y sudo tzdata \ @@ -30,7 +32,7 @@ RUN apt-get update -y && sudo apt-get upgrade -y \ gnupg; fi) \ unzip \ && wget \ - --quiet "https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh" \ + --quiet "https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-${HOSTTYPE}.sh" \ -O /tmp/miniconda.sh \ && /bin/bash /tmp/miniconda.sh -b -u -p $HOME/anaconda3 \ && $HOME/anaconda3/bin/conda init \ diff --git a/docker/ray/README.md b/docker/ray/README.md index 4a0958d2d25d..0a908187881a 100644 --- a/docker/ray/README.md +++ b/docker/ray/README.md @@ -4,7 +4,7 @@ everything needed to get started with running Ray! They work for both local deve ## Tags -Images are `tagged` with the format `{Ray version}[-{Python version}][-{Platform}]`. `Ray version` tag can be one of the following: +Images are `tagged` with the format `{Ray version}[-{Python version}][-{Platform}][-{Architecture}]`. `Ray version` tag can be one of the following: | Ray version tag | Description | | --------------- | ----------- | @@ -24,11 +24,37 @@ The optional `Platform` tag specifies the platform where the image is intended f | `-gpu` | Aliases to a specific `-cuXX` tagged image. | | no tag | Aliases to `-cpu` tagged images for `ray`, and aliases to ``-gpu`` tagged images for `ray-ml`. | +The optional `Architecture` tag can be used to specify images for different CPU architectures. +Currently, we support the `x86_64` (`amd64`) and `aarch64` (`arm64`) architectures. + +Please note that suffixes are only used to specify `aarch64` images. No suffix means +`x86_64`/`amd64`-compatible images. + +| Platform tag | Description | +|--------------|-------------------------| +| `-aarch64` | arm64-compatible images | +| no tag | Defaults to `amd64` | + Examples tags: - none: equivalent to `latest` - `latest`: equivalent to `latest-py37-cpu`, i.e. image for the most recent Ray release - `nightly-py38-cpu` - `806c18-py38-cu112` +- `806c18-py38-cu116-aarch64` + +## Roadmap + +Ray 2.3 will be the first release for which arm64 images are released. These images will have the `-aarch64` suffix. + +There won't be a `:latest-aarch64` image, instead `:2.3.0-aarch64` should be used explicitly. This is because +we may remove suffixes in the next release. + +For Ray 2.4, we aim to have support for multiplatform images. This means that specifying the suffix +will not be needed anymore - docker will automatically choose a compatible image. + +We may stop publishing architecture suffixes completely when we have support for multiplatform images. 
+ +There is an open RFC issue on GitHub to discuss this roadmap: [Link to issue](https://github.com/ray-project/ray/issues/31966) ## Other Images * [`rayproject/ray-ml`](https://hub.docker.com/repository/docker/rayproject/ray-ml) - This image with common ML libraries to make development & deployment more smooth! From 6b081e9e000f181cb05036c91e3369e58c2baba3 Mon Sep 17 00:00:00 2001 From: Eric Liang Date: Thu, 26 Jan 2023 11:35:56 -0800 Subject: [PATCH 008/267] [data] [streaming] [11/n]--- Run streaming executor on a helper thread (#31951) We currently run the streaming control loop on the user thread, which means it stalls between generator yields. This moves it in a separate thread to avoid unnecessary stalls. We still provide backpressure via the queue between threads (size set to 1). This improves ingest throughput by 20% on a benchmark I tried (1.0->1.2GB/s). The queue size did not seem to matter, just having it >=1 was sufficient to provide the performance improvement. --- .../_internal/execution/streaming_executor.py | 66 ++++++++++++++----- 1 file changed, 48 insertions(+), 18 deletions(-) diff --git a/python/ray/data/_internal/execution/streaming_executor.py b/python/ray/data/_internal/execution/streaming_executor.py index 1d3543100b0c..b2f169869b59 100644 --- a/python/ray/data/_internal/execution/streaming_executor.py +++ b/python/ray/data/_internal/execution/streaming_executor.py @@ -1,4 +1,6 @@ import logging +import queue +import threading import os from typing import Iterator, Optional @@ -27,7 +29,7 @@ DEBUG_TRACE_SCHEDULING = "RAY_DATASET_TRACE_SCHEDULING" in os.environ -class StreamingExecutor(Executor): +class StreamingExecutor(Executor, threading.Thread): """A streaming Dataset executor. This implementation executes Dataset DAGs in a fully streamed way. It runs @@ -41,9 +43,16 @@ def __init__(self, options: ExecutionOptions): # data updates the stats object in legacy code). self._stats: Optional[DatasetStats] = None self._global_info: Optional[ProgressBar] = None - if options.locality_with_output: - raise NotImplementedError("locality with output") - super().__init__(options) + + # Internal execution state shared across thread boundaries. We run the control + # loop on a separate thread so that it doesn't become stalled between + # generator `yield`s. + self._runner_thread_out = queue.Queue(maxsize=1) + self._topology: Optional[Topology] = None + self._output_node: Optional[OpState] = None + + Executor.__init__(self, options) + threading.Thread.__init__(self) def execute( self, dag: PhysicalOperator, initial_stats: Optional[DatasetStats] = None @@ -57,27 +66,48 @@ def execute( logger.info("Executing DAG %s", dag) self._global_info = ProgressBar("Resource usage vs limits", 1, 0) - # Setup the streaming DAG topology. - topology, self._stats = build_streaming_topology(dag, self._options) - output_node: OpState = topology[dag] + # Setup the streaming DAG topology and start the runner thread. + self._topology, self._stats = build_streaming_topology(dag, self._options) + _validate_topology(self._topology, self._get_or_refresh_resource_limits()) + self._output_node: OpState = self._topology[dag] + self.start() + + # Drain items from the runner thread until completion. 
try: - _validate_topology(topology, self._get_or_refresh_resource_limits()) - output_node: OpState = topology[dag] + item = self._runner_thread_out.get() + while item is not None: + if isinstance(item, Exception): + raise item + else: + yield item + item = self._runner_thread_out.get() + finally: + for op in self._topology: + op.shutdown() + if self._global_info: + self._global_info.close() + def run(self): + """Run the control loop in a helper thread. + + Results are returned via the `self._runner_thread_out` queue. + """ + try: # Run scheduling loop until complete. - while self._scheduling_loop_step(topology): - while output_node.outqueue: - yield output_node.outqueue.pop(0) + while self._scheduling_loop_step(self._topology): + while self._output_node.outqueue: + self._runner_thread_out.put(self._output_node.outqueue.pop(0)) # Handle any leftover outputs. - while output_node.outqueue: - yield output_node.outqueue.pop(0) + while self._output_node.outqueue: + self._runner_thread_out.put(self._output_node.outqueue.pop(0)) + except Exception as e: + # Propagate it to the result iterator. + self._runner_thread_out.put(e) finally: - for op in topology: - op.shutdown() - if self._global_info: - self._global_info.close() + # Signal end of results. + self._runner_thread_out.put(None) def get_stats(self): """Return the stats object for the streaming execution. From 39a901eb40aa1d55639ddd90bcd4094182e999a9 Mon Sep 17 00:00:00 2001 From: Yi Cheng <74173148+iycheng@users.noreply.github.com> Date: Thu, 26 Jan 2023 14:21:39 -0800 Subject: [PATCH 009/267] [nightly] Delete deprecated flags in nightly test. (#31973) ## Why are these changes needed? These flags are no longer useful because the migration has been finished. Delete them. ## Related issue number ## Checks - [ ] I've signed off every commit(by using the -s flag, i.e., `git commit -s`) in this PR. - [ ] I've run `scripts/format.sh` to lint the changes in this PR. - [ ] I've included any doc changes needed for https://docs.ray.io/en/master/. - [ ] I've made sure the tests are passing. Note that there might be a few flaky tests, see the recent failures at https://flakey-tests.ray.io/ - Testing Strategy - [ ] Unit tests - [ ] Release tests - [ ] This PR is not tested :( --- release/ray_release/cluster_manager/cluster_manager.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/release/ray_release/cluster_manager/cluster_manager.py b/release/ray_release/cluster_manager/cluster_manager.py index f4e44579af90..5455360c2107 100644 --- a/release/ray_release/cluster_manager/cluster_manager.py +++ b/release/ray_release/cluster_manager/cluster_manager.py @@ -54,8 +54,6 @@ def set_cluster_env(self, cluster_env: Dict[str, Any]): # Add flags for redisless Ray self.cluster_env.setdefault("env_vars", {}) self.cluster_env["env_vars"]["MATCH_AUTOSCALER_AND_RAY_IMAGES"] = "1" - self.cluster_env["env_vars"]["RAY_gcs_storage"] = "memory" - self.cluster_env["env_vars"]["RAY_bootstrap_with_gcs"] = "1" self.cluster_env["env_vars"]["RAY_USAGE_STATS_ENABLED"] = "1" self.cluster_env["env_vars"]["RAY_USAGE_STATS_SOURCE"] = "nightly-tests" self.cluster_env["env_vars"][ From a32b9b1bf21bb3cd971ce48aa9517810693d8f1f Mon Sep 17 00:00:00 2001 From: Yi Cheng <74173148+iycheng@users.noreply.github.com> Date: Thu, 26 Jan 2023 15:09:40 -0800 Subject: [PATCH 010/267] [core] Fix gcs healthch manager crash when node is removed by node manager. (#31917) The root cause is because the data structure is deleted, but call backs is not canceled and got executed. 
This PR simplify the life model and make it the way gRPC works. We only delete the structure after gRPC OnDone is called. In the shortcut, according to the doc https://github.com/grpc/proposal/blob/master/L67-cpp-callback-api.md#unary-rpc-shortcuts , OnDone will call the callback function. A better model is needed here. The code will be changed once we update the threading model in gRPC. --- .bazelrc | 1 + BUILD.bazel | 2 +- .../gcs_server/gcs_health_check_manager.cc | 48 ++++++------ .../gcs/gcs_server/gcs_health_check_manager.h | 23 ++---- .../test/gcs_health_check_manager_test.cc | 75 +++++++++++++++---- 5 files changed, 90 insertions(+), 59 deletions(-) diff --git a/.bazelrc b/.bazelrc index 1c4b9f296b8f..1b98b8f72a3f 100644 --- a/.bazelrc +++ b/.bazelrc @@ -97,6 +97,7 @@ build:tsan --copt -g build:tsan --copt -fno-omit-frame-pointer build:tsan --copt -Wno-uninitialized build:tsan --linkopt -fsanitize=thread +build:tsan --cxxopt="-D_RAY_TSAN_BUILD" # This config is only for running TSAN with LLVM toolchain on Linux. build:tsan-clang --config=tsan build:tsan-clang --config=llvm diff --git a/BUILD.bazel b/BUILD.bazel index 82e9a74be901..9b6b22d43240 100644 --- a/BUILD.bazel +++ b/BUILD.bazel @@ -1856,7 +1856,7 @@ cc_library( cc_test( name = "gcs_health_check_manager_test", - size = "small", + size = "medium", srcs = [ "src/ray/gcs/gcs_server/test/gcs_health_check_manager_test.cc", ], diff --git a/src/ray/gcs/gcs_server/gcs_health_check_manager.cc b/src/ray/gcs/gcs_server/gcs_health_check_manager.cc index 831f345ef81a..7a3d99e74e05 100644 --- a/src/ray/gcs/gcs_server/gcs_health_check_manager.cc +++ b/src/ray/gcs/gcs_server/gcs_health_check_manager.cc @@ -53,6 +53,7 @@ void GcsHealthCheckManager::RemoveNode(const NodeID &node_id) { if (iter == health_check_contexts_.end()) { return; } + iter->second->Stop(); health_check_contexts_.erase(iter); }, "GcsHealthCheckManager::RemoveNode"); @@ -60,8 +61,11 @@ void GcsHealthCheckManager::RemoveNode(const NodeID &node_id) { void GcsHealthCheckManager::FailNode(const NodeID &node_id) { RAY_LOG(WARNING) << "Node " << node_id << " is dead because the health check failed."; - on_node_death_callback_(node_id); - health_check_contexts_.erase(node_id); + auto iter = health_check_contexts_.find(node_id); + if (iter != health_check_contexts_.end()) { + on_node_death_callback_(node_id); + health_check_contexts_.erase(iter); + } } std::vector GcsHealthCheckManager::GetAllNodes() const { @@ -75,27 +79,23 @@ std::vector GcsHealthCheckManager::GetAllNodes() const { void GcsHealthCheckManager::HealthCheckContext::StartHealthCheck() { using ::grpc::health::v1::HealthCheckResponse; - context_ = std::make_shared(); + // Reset the context/request/response for the next request. + context_.~ClientContext(); + new (&context_) grpc::ClientContext(); + response_.Clear(); auto deadline = std::chrono::system_clock::now() + std::chrono::milliseconds(manager_->timeout_ms_); - context_->set_deadline(deadline); + context_.set_deadline(deadline); stub_->async()->Check( - context_.get(), - &request_, - &response_, - [this, stopped = this->stopped_, context = this->context_, now = absl::Now()]( - ::grpc::Status status) { + &context_, &request_, &response_, [this, now = absl::Now()](::grpc::Status status) { // This callback is done in gRPC's thread pool. 
STATS_health_check_rpc_latency_ms.Record( absl::ToInt64Milliseconds(absl::Now() - now)); - if (status.error_code() == ::grpc::StatusCode::CANCELLED) { - return; - } manager_->io_service_.post( - [this, stopped, status]() { - // Stopped has to be read in the same thread where it's updated. - if (*stopped) { + [this, status]() { + if (stopped_) { + delete this; return; } RAY_LOG(DEBUG) << "Health check status: " << int(response_.status()); @@ -110,32 +110,28 @@ void GcsHealthCheckManager::HealthCheckContext::StartHealthCheck() { } if (health_check_remaining_ == 0) { - manager_->io_service_.post([this]() { manager_->FailNode(node_id_); }, - ""); + manager_->FailNode(node_id_); + delete this; } else { // Do another health check. timer_.expires_from_now( boost::posix_time::milliseconds(manager_->period_ms_)); - timer_.async_wait([this, stopped](auto ec) { - // We need to check stopped here as well since cancel - // won't impact the queued tasks. - if (ec != boost::asio::error::operation_aborted && !*stopped) { - StartHealthCheck(); - } - }); + timer_.async_wait([this](auto) { StartHealthCheck(); }); } }, "HealthCheck"); }); } +void GcsHealthCheckManager::HealthCheckContext::Stop() { stopped_ = true; } + void GcsHealthCheckManager::AddNode(const NodeID &node_id, std::shared_ptr channel) { io_service_.dispatch( [this, channel, node_id]() { RAY_CHECK(health_check_contexts_.count(node_id) == 0); - auto context = std::make_unique(this, channel, node_id); - health_check_contexts_.emplace(std::make_pair(node_id, std::move(context))); + auto context = new HealthCheckContext(this, channel, node_id); + health_check_contexts_.emplace(std::make_pair(node_id, context)); }, "GcsHealthCheckManager::AddNode"); } diff --git a/src/ray/gcs/gcs_server/gcs_health_check_manager.h b/src/ray/gcs/gcs_server/gcs_health_check_manager.h index e0daea5edfcf..d877a217d803 100644 --- a/src/ray/gcs/gcs_server/gcs_health_check_manager.h +++ b/src/ray/gcs/gcs_server/gcs_health_check_manager.h @@ -91,27 +91,16 @@ class GcsHealthCheckManager { NodeID node_id) : manager_(manager), node_id_(node_id), - stopped_(std::make_shared(false)), timer_(manager->io_service_), health_check_remaining_(manager->failure_threshold_) { request_.set_service(node_id.Hex()); stub_ = grpc::health::v1::Health::NewStub(channel); timer_.expires_from_now( boost::posix_time::milliseconds(manager_->initial_delay_ms_)); - timer_.async_wait([this](auto ec) { - if (ec != boost::asio::error::operation_aborted) { - StartHealthCheck(); - } - }); + timer_.async_wait([this](auto) { StartHealthCheck(); }); } - ~HealthCheckContext() { - timer_.cancel(); - if (context_ != nullptr) { - context_->TryCancel(); - } - *stopped_ = true; - } + void Stop(); private: void StartHealthCheck(); @@ -121,14 +110,12 @@ class GcsHealthCheckManager { NodeID node_id_; // Whether the health check has stopped. - std::shared_ptr stopped_; + bool stopped_ = false; /// gRPC related fields std::unique_ptr<::grpc::health::v1::Health::Stub> stub_; - // The context is used in the gRPC callback which is in another - // thread, so we need it to be a shared_ptr. - std::shared_ptr context_; + grpc::ClientContext context_; ::grpc::health::v1::HealthCheckRequest request_; ::grpc::health::v1::HealthCheckResponse response_; @@ -146,7 +133,7 @@ class GcsHealthCheckManager { std::function on_node_death_callback_; /// The context of the health check for each nodes. - absl::flat_hash_map> health_check_contexts_; + absl::flat_hash_map health_check_contexts_; /// The delay for the first health check request. 
const int64_t initial_delay_ms_; diff --git a/src/ray/gcs/gcs_server/test/gcs_health_check_manager_test.cc b/src/ray/gcs/gcs_server/test/gcs_health_check_manager_test.cc index f4f4bf8cefb2..31be1bbd5d6d 100644 --- a/src/ray/gcs/gcs_server/test/gcs_health_check_manager_test.cc +++ b/src/ray/gcs/gcs_server/test/gcs_health_check_manager_test.cc @@ -19,9 +19,13 @@ #include #include #include +#include #include using namespace boost; +using namespace boost::asio; +using namespace boost::asio::ip; + #include #include @@ -30,6 +34,20 @@ using namespace boost; #include "gtest/gtest.h" #include "ray/gcs/gcs_server/gcs_health_check_manager.h" +int GetFreePort() { + io_service io_service; + tcp::acceptor acceptor(io_service); + tcp::endpoint endpoint; + + // try to bind to port 0 to find a free port + acceptor.open(tcp::v4()); + acceptor.bind(tcp::endpoint(tcp::v4(), 0)); + endpoint = acceptor.local_endpoint(); + auto port = endpoint.port(); + acceptor.close(); + return port; +} + using namespace ray; using namespace std::literals::chrono_literals; @@ -46,7 +64,6 @@ class GcsHealthCheckManagerTest : public ::testing::Test { timeout_ms, period_ms, failure_threshold); - port = 10000; } void TearDown() override { @@ -65,7 +82,8 @@ class GcsHealthCheckManagerTest : public ::testing::Test { NodeID AddServer(bool alive = true) { std::promise port_promise; auto node_id = NodeID::FromRandom(); - + auto port = GetFreePort(); + RAY_LOG(INFO) << "Get port " << port; auto server = std::make_shared(node_id.Hex(), port, true); auto channel = grpc::CreateChannel("localhost:" + std::to_string(port), @@ -76,7 +94,6 @@ class GcsHealthCheckManagerTest : public ::testing::Test { } servers.emplace(node_id, server); health_check->AddNode(node_id, channel); - ++port; return node_id; } @@ -115,14 +132,13 @@ class GcsHealthCheckManagerTest : public ::testing::Test { } } - int port; instrumented_io_context io_service; std::unique_ptr health_check; std::unordered_map> servers; std::unordered_set dead_nodes; - const int64_t initial_delay_ms = 1000; - const int64_t timeout_ms = 1000; - const int64_t period_ms = 1000; + const int64_t initial_delay_ms = 100; + const int64_t timeout_ms = 10; + const int64_t period_ms = 10; const int64_t failure_threshold = 5; }; @@ -143,8 +159,6 @@ TEST_F(GcsHealthCheckManagerTest, TestBasic) { Run(2); // One for starting RPC and one for the RPC callback. } - Run(); // For failure callback. - ASSERT_EQ(1, dead_nodes.size()); ASSERT_TRUE(dead_nodes.count(node_id)); } @@ -169,8 +183,6 @@ TEST_F(GcsHealthCheckManagerTest, StoppedAndResume) { } } - Run(); // For failure callback. - ASSERT_EQ(0, dead_nodes.size()); } @@ -196,8 +208,6 @@ TEST_F(GcsHealthCheckManagerTest, Crashed) { Run(2); // One for starting RPC and one for the RPC callback. } - Run(); // For failure callback. - ASSERT_EQ(1, dead_nodes.size()); ASSERT_TRUE(dead_nodes.count(node_id)); } @@ -230,12 +240,49 @@ TEST_F(GcsHealthCheckManagerTest, NoRegister) { Run(2); // One for starting RPC and one for the RPC callback. 
} - Run(2); + Run(1); ASSERT_EQ(1, dead_nodes.size()); ASSERT_TRUE(dead_nodes.count(node_id)); } +TEST_F(GcsHealthCheckManagerTest, StressTest) { +#ifdef _RAY_TSAN_BUILD + GTEST_SKIP() << "Disabled in tsan because of performance"; +#endif + boost::asio::io_service::work work(io_service); + std::srand(std::time(nullptr)); + auto t = std::make_unique([this]() { this->io_service.run(); }); + + std::vector alive_nodes; + + for (int i = 0; i < 200; ++i) { + alive_nodes.emplace_back(AddServer(true)); + std::this_thread::sleep_for(10ms); + } + + for (size_t i = 0; i < 20000UL; ++i) { + RAY_LOG(INFO) << "Progress: " << i << "/20000"; + auto iter = alive_nodes.begin() + std::rand() % alive_nodes.size(); + health_check->RemoveNode(*iter); + DeleteServer(*iter); + alive_nodes.erase(iter); + alive_nodes.emplace_back(AddServer(true)); + } + RAY_LOG(INFO) << "Finished!"; + io_service.stop(); + t->join(); +} + int main(int argc, char **argv) { + InitShutdownRAII ray_log_shutdown_raii(ray::RayLog::StartRayLog, + ray::RayLog::ShutDownRayLog, + argv[0], + ray::RayLogLevel::INFO, + /*log_dir=*/""); + + ray::RayLog::InstallFailureSignalHandler(argv[0]); + ray::RayLog::InstallTerminateHandler(); + ::testing::InitGoogleTest(&argc, argv); return RUN_ALL_TESTS(); } From e753b03c23aa630d59c7f032cd6f17877788f950 Mon Sep 17 00:00:00 2001 From: Alex Wu Date: Thu, 26 Jan 2023 15:27:20 -0800 Subject: [PATCH 011/267] [1/n] Stabilize GCS/Autoscaler interface: Introduce monitor server (#31827) This is the first PR towards stabilizing the GCS autoscaler interface by introducing a new grpc service definition which we will provide backwards compatibility guarantees. This PR mostly just introduces scaffolding and a trivial GetRayVersion endpoint. By the end of this series of PRs, monitor.py will only communicate with the rest of the ray cluster via this service definition. 
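For reference, a minimal client sketch against the new service (mirroring the `test_monitor_service.py` test added below; the GCS address shown is a placeholder and would normally come from the running cluster):

```python
# Sketch only: query the new MonitorGcsService for the Ray version.
# Assumes the generated monitor_pb2 / monitor_pb2_grpc stubs from monitor.proto
# and a reachable GCS address (the address below is a placeholder).
import grpc
from ray.core.generated import monitor_pb2, monitor_pb2_grpc

channel = grpc.insecure_channel("127.0.0.1:6379")  # placeholder GCS address
stub = monitor_pb2_grpc.MonitorGcsServiceStub(channel)
reply = stub.GetRayVersion(monitor_pb2.GetRayVersionRequest())
print(reply.version)  # should match ray.__version__
```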
--- BUILD.bazel | 36 +++++++++++++++ python/ray/tests/BUILD | 8 ++++ python/ray/tests/test_monitor_service.py | 18 ++++++++ src/ray/gcs/gcs_server/gcs_monitor_server.cc | 32 +++++++++++++ src/ray/gcs/gcs_server/gcs_monitor_server.h | 33 +++++++++++++ src/ray/gcs/gcs_server/gcs_server.cc | 10 ++++ src/ray/gcs/gcs_server/gcs_server.h | 8 ++++ .../test/gcs_monitor_server_test.cc | 46 +++++++++++++++++++ src/ray/protobuf/BUILD | 15 ++++++ src/ray/protobuf/monitor.proto | 30 ++++++++++++ src/ray/rpc/gcs_server/gcs_rpc_server.h | 42 +++++++++++++++++ 11 files changed, 278 insertions(+) create mode 100644 python/ray/tests/test_monitor_service.py create mode 100644 src/ray/gcs/gcs_server/gcs_monitor_server.cc create mode 100644 src/ray/gcs/gcs_server/gcs_monitor_server.h create mode 100644 src/ray/gcs/gcs_server/test/gcs_monitor_server_test.cc create mode 100644 src/ray/protobuf/monitor.proto diff --git a/BUILD.bazel b/BUILD.bazel index 9b6b22d43240..39c9ddd285da 100644 --- a/BUILD.bazel +++ b/BUILD.bazel @@ -272,6 +272,23 @@ cc_library( ], ) +# monitor/autoscaler service +cc_grpc_library( + name = "monitor_cc_grpc", + srcs = ["//src/ray/protobuf:monitor_proto"], + grpc_only = True, + deps = ["//src/ray/protobuf:monitor_cc_proto"], +) + +cc_library( + name = "monitor_rpc", + copts = COPTS, + visibility = ["//visibility:public"], + deps = [ + ":monitor_cc_grpc", + ], +) + # === End of rpc definitions === # === Begin of plasma definitions === @@ -541,6 +558,7 @@ cc_library( ":gcs_service_cc_grpc", ":gcs_service_rpc", ":gcs_table_storage_lib", + ":monitor_rpc", ":node_manager_rpc", ":observable_store_client", ":pubsub_lib", @@ -2020,6 +2038,23 @@ cc_test( ], ) +cc_test( + name = "gcs_monitor_server_test", + size = "small", + srcs = [ + "src/ray/gcs/gcs_server/test/gcs_monitor_server_test.cc", + ], + copts = COPTS, + tags = ["team:serverless"], + deps = [ + ":gcs_server_lib", + ":gcs_server_test_util", + ":gcs_test_util_lib", + ":ray_mock", + "@com_google_googletest//:gtest_main", + ], +) + cc_library( name = "gcs_table_storage_lib", srcs = glob( @@ -2828,6 +2863,7 @@ filegroup( "//src/ray/protobuf:gcs_py_proto", "//src/ray/protobuf:gcs_service_py_proto", "//src/ray/protobuf:job_agent_py_proto", + "//src/ray/protobuf:monitor_py_proto", "//src/ray/protobuf:node_manager_py_proto", "//src/ray/protobuf:ray_client_py_proto", "//src/ray/protobuf:reporter_py_proto", diff --git a/python/ray/tests/BUILD b/python/ray/tests/BUILD index d158b9372a8b..56241ea1343b 100644 --- a/python/ray/tests/BUILD +++ b/python/ray/tests/BUILD @@ -203,6 +203,14 @@ py_test_module_list( deps = ["//:ray_lib", ":conftest"], ) +py_test_module_list( + files = [ + "test_monitor_service.py", + ], + size = "medium", + tags = ["exclusive", "medium_size_python_tests_k_to_z", "team:serverless"], + deps = ["//:ray_lib", ":conftest"], +) py_test_module_list( files = [ diff --git a/python/ray/tests/test_monitor_service.py b/python/ray/tests/test_monitor_service.py new file mode 100644 index 000000000000..71c7a3e2af47 --- /dev/null +++ b/python/ray/tests/test_monitor_service.py @@ -0,0 +1,18 @@ +import pytest + +import ray +import grpc +from ray.core.generated import monitor_pb2, monitor_pb2_grpc + + +@pytest.fixture +def monitor_stub(ray_start_regular_shared): + channel = grpc.insecure_channel(ray_start_regular_shared["gcs_address"]) + + return monitor_pb2_grpc.MonitorGcsServiceStub(channel) + + +def test_ray_version(monitor_stub): + request = monitor_pb2.GetRayVersionRequest() + response = monitor_stub.GetRayVersion(request) + assert 
response.version == ray.__version__ diff --git a/src/ray/gcs/gcs_server/gcs_monitor_server.cc b/src/ray/gcs/gcs_server/gcs_monitor_server.cc new file mode 100644 index 000000000000..af0d36c93134 --- /dev/null +++ b/src/ray/gcs/gcs_server/gcs_monitor_server.cc @@ -0,0 +1,32 @@ +// Copyright 2017 The Ray Authors. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +#include "ray/gcs/gcs_server/gcs_monitor_server.h" + +#include "ray/common/constants.h" + +namespace ray { +namespace gcs { + +GcsMonitorServer::GcsMonitorServer() {} + +void GcsMonitorServer::HandleGetRayVersion(rpc::GetRayVersionRequest request, + rpc::GetRayVersionReply *reply, + rpc::SendReplyCallback send_reply_callback) { + reply->set_version(kRayVersion); + send_reply_callback(Status::OK(), nullptr, nullptr); +} + +} // namespace gcs +} // namespace ray diff --git a/src/ray/gcs/gcs_server/gcs_monitor_server.h b/src/ray/gcs/gcs_server/gcs_monitor_server.h new file mode 100644 index 000000000000..4fa85bb3b5f7 --- /dev/null +++ b/src/ray/gcs/gcs_server/gcs_monitor_server.h @@ -0,0 +1,33 @@ +// Copyright 2023 The Ray Authors. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +#pragma once + +#include "ray/rpc/gcs_server/gcs_rpc_server.h" + +namespace ray { +namespace gcs { + +/// GcsMonitorServer is a shim responsible for providing a compatible interface between +/// GCS and `monitor.py` +class GcsMonitorServer : public rpc::MonitorServiceHandler { + public: + explicit GcsMonitorServer(); + + void HandleGetRayVersion(rpc::GetRayVersionRequest request, + rpc::GetRayVersionReply *reply, + rpc::SendReplyCallback send_reply_callback) override; +}; +} // namespace gcs +} // namespace ray diff --git a/src/ray/gcs/gcs_server/gcs_server.cc b/src/ray/gcs/gcs_server/gcs_server.cc index 5d9f98db3b83..1b013bd79f22 100644 --- a/src/ray/gcs/gcs_server/gcs_server.cc +++ b/src/ray/gcs/gcs_server/gcs_server.cc @@ -166,6 +166,9 @@ void GcsServer::DoStart(const GcsInitData &gcs_init_data) { // Init GCS task manager. InitGcsTaskManager(); + // Init Monitor service. + InitMonitorServer(); + // Install event listeners. 
InstallEventListeners(); @@ -586,6 +589,13 @@ void GcsServer::InitGcsTaskManager() { rpc_server_.RegisterService(*task_info_service_); } +void GcsServer::InitMonitorServer() { + monitor_server_ = std::make_unique(); + monitor_grpc_service_.reset( + new rpc::MonitorGrpcService(main_service_, *monitor_server_)); + rpc_server_.RegisterService(*monitor_grpc_service_); +} + void GcsServer::InstallEventListeners() { // Install node event listeners. gcs_node_manager_->AddNodeAddedListener([this](std::shared_ptr node) { diff --git a/src/ray/gcs/gcs_server/gcs_server.h b/src/ray/gcs/gcs_server/gcs_server.h index f6397452aceb..dadc1f81e6e7 100644 --- a/src/ray/gcs/gcs_server/gcs_server.h +++ b/src/ray/gcs/gcs_server/gcs_server.h @@ -22,6 +22,7 @@ #include "ray/gcs/gcs_server/gcs_health_check_manager.h" #include "ray/gcs/gcs_server/gcs_init_data.h" #include "ray/gcs/gcs_server/gcs_kv_manager.h" +#include "ray/gcs/gcs_server/gcs_monitor_server.h" #include "ray/gcs/gcs_server/gcs_redis_failure_detector.h" #include "ray/gcs/gcs_server/gcs_table_storage.h" #include "ray/gcs/gcs_server/gcs_task_manager.h" @@ -151,6 +152,9 @@ class GcsServer { /// Install event listeners. void InstallEventListeners(); + /// Initialize monitor service. + void InitMonitorServer(); + private: /// Gets the type of KV storage to use from config. std::string StorageType() const; @@ -215,6 +219,10 @@ class GcsServer { std::unique_ptr function_manager_; /// Node resource info handler and service. std::unique_ptr node_resource_info_service_; + /// Monitor server supports monitor.py + std::unique_ptr monitor_server_; + /// Monitor service for monitor server + std::unique_ptr monitor_grpc_service_; /// Synchronization service for ray. /// TODO(iycheng): Deprecate this gcs_ray_syncer_ one once we roll out diff --git a/src/ray/gcs/gcs_server/test/gcs_monitor_server_test.cc b/src/ray/gcs/gcs_server/test/gcs_monitor_server_test.cc new file mode 100644 index 000000000000..cba584afc6a3 --- /dev/null +++ b/src/ray/gcs/gcs_server/test/gcs_monitor_server_test.cc @@ -0,0 +1,46 @@ + +// Copyright 2017 The Ray Authors. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. 
+ +#include + +// clang-format off +#include "gtest/gtest.h" +#include "ray/gcs/gcs_server/test/gcs_server_test_util.h" +#include "ray/gcs/test/gcs_test_util.h" +#include "ray/gcs/gcs_server/gcs_monitor_server.h" +#include "mock/ray/pubsub/publisher.h" +// clang-format on + +namespace ray { +class GcsMonitorServerTest : public ::testing::Test { + public: + GcsMonitorServerTest() : monitor_server_() {} + + protected: + gcs::GcsMonitorServer monitor_server_; +}; + +TEST_F(GcsMonitorServerTest, TestRayVersion) { + rpc::GetRayVersionRequest request; + rpc::GetRayVersionReply reply; + auto send_reply_callback = + [](ray::Status status, std::function f1, std::function f2) {}; + + monitor_server_.HandleGetRayVersion(request, &reply, send_reply_callback); + + ASSERT_EQ(reply.version(), kRayVersion); +} + +} // namespace ray diff --git a/src/ray/protobuf/BUILD b/src/ray/protobuf/BUILD index 499e0445be9c..22054c994261 100644 --- a/src/ray/protobuf/BUILD +++ b/src/ray/protobuf/BUILD @@ -4,6 +4,21 @@ load("@rules_proto//proto:defs.bzl", "proto_library") load("@rules_cc//cc:defs.bzl", "cc_binary", "cc_library", "cc_proto_library", "cc_test") load("@rules_proto_grpc//python:defs.bzl", "python_grpc_compile") +proto_library( + name = "monitor_proto", + srcs = ["monitor.proto"], +) + +cc_proto_library( + name = "monitor_cc_proto", + deps = [":monitor_proto"], +) + +python_grpc_compile( + name = "monitor_py_proto", + deps = [":monitor_proto"], +) + proto_library( name = "common_proto", srcs = ["common.proto"], diff --git a/src/ray/protobuf/monitor.proto b/src/ray/protobuf/monitor.proto new file mode 100644 index 000000000000..b8190fd9d1e1 --- /dev/null +++ b/src/ray/protobuf/monitor.proto @@ -0,0 +1,30 @@ +// Copyright 2017 The Ray Authors. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +syntax = "proto3"; +option cc_enable_arenas = true; +package ray.rpc; + +message GetRayVersionRequest {} + +message GetRayVersionReply { + string version = 1; +} + +// This service provides a stable interface for a monitor/autoscaler process to interact +// with Ray. +service MonitorGcsService { + // Get the ray version of the service. 
+ rpc GetRayVersion(GetRayVersionRequest) returns (GetRayVersionReply); +} diff --git a/src/ray/rpc/gcs_server/gcs_rpc_server.h b/src/ray/rpc/gcs_server/gcs_rpc_server.h index c2453c88a1df..bcfca5052d9b 100644 --- a/src/ray/rpc/gcs_server/gcs_rpc_server.h +++ b/src/ray/rpc/gcs_server/gcs_rpc_server.h @@ -19,6 +19,7 @@ #include "ray/rpc/grpc_server.h" #include "ray/rpc/server_call.h" #include "src/ray/protobuf/gcs_service.grpc.pb.h" +#include "src/ray/protobuf/monitor.grpc.pb.h" namespace ray { namespace rpc { @@ -31,6 +32,11 @@ namespace rpc { #define ACTOR_INFO_SERVICE_RPC_HANDLER(HANDLER, MAX_ACTIVE_RPCS) \ RPC_SERVICE_HANDLER(ActorInfoGcsService, HANDLER, MAX_ACTIVE_RPCS) +#define MONITOR_SERVICE_RPC_HANDLER(HANDLER) \ + RPC_SERVICE_HANDLER(MonitorGcsService, \ + HANDLER, \ + RayConfig::instance().gcs_max_active_rpcs_per_handler()) + #define NODE_INFO_SERVICE_RPC_HANDLER(HANDLER) \ RPC_SERVICE_HANDLER(NodeInfoGcsService, \ HANDLER, \ @@ -209,6 +215,41 @@ class ActorInfoGrpcService : public GrpcService { ActorInfoGcsServiceHandler &service_handler_; }; +class MonitorGcsServiceHandler { + public: + virtual ~MonitorGcsServiceHandler() = default; + + virtual void HandleGetRayVersion(GetRayVersionRequest request, + GetRayVersionReply *reply, + SendReplyCallback send_reply_callback) = 0; +}; + +/// The `GrpcService` for `MonitorServer`. +class MonitorGrpcService : public GrpcService { + public: + /// Constructor. + /// + /// \param[in] handler The service handler that actually handle the requests. + explicit MonitorGrpcService(instrumented_io_context &io_service, + MonitorGcsServiceHandler &handler) + : GrpcService(io_service), service_handler_(handler){}; + + protected: + grpc::Service &GetGrpcService() override { return service_; } + + void InitServerCallFactories( + const std::unique_ptr &cq, + std::vector> *server_call_factories) override { + MONITOR_SERVICE_RPC_HANDLER(GetRayVersion); + } + + private: + /// The grpc async service object. + MonitorGcsService::AsyncService service_; + /// The service handler that actually handle the requests. + MonitorGcsServiceHandler &service_handler_; +}; + class NodeInfoGcsServiceHandler { public: virtual ~NodeInfoGcsServiceHandler() = default; @@ -581,6 +622,7 @@ class InternalPubSubGrpcService : public GrpcService { using JobInfoHandler = JobInfoGcsServiceHandler; using ActorInfoHandler = ActorInfoGcsServiceHandler; +using MonitorServiceHandler = MonitorGcsServiceHandler; using NodeInfoHandler = NodeInfoGcsServiceHandler; using NodeResourceInfoHandler = NodeResourceInfoGcsServiceHandler; using WorkerInfoHandler = WorkerInfoGcsServiceHandler; From f59f1e6b53a1f385619f8927295a90e7fa066508 Mon Sep 17 00:00:00 2001 From: Balaji Veeramani Date: Thu, 26 Jan 2023 16:08:11 -0800 Subject: [PATCH 012/267] [docs] Improve visibility of API annotations (#31971) Closes https://github.com/ray-project/ray/issues/30396 --- python/ray/util/annotations.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/python/ray/util/annotations.py b/python/ray/util/annotations.py index 9996b092fcab..f7b93746f910 100644 --- a/python/ray/util/annotations.py +++ b/python/ray/util/annotations.py @@ -49,7 +49,7 @@ def PublicAPI(*args, **kwargs): def wrap(obj): if stability in ["alpha", "beta"]: message = ( - f"PublicAPI ({stability}): This API is in {stability} " + f"**PublicAPI ({stability}):** This API is in {stability} " "and may change before becoming stable." 
) else: @@ -80,7 +80,8 @@ def DeveloperAPI(*args, **kwargs): def wrap(obj): _append_doc( - obj, message="DeveloperAPI: This API may change across minor Ray releases." + obj, + message="**DeveloperAPI:** This API may change across minor Ray releases.", ) _mark_annotated(obj) return obj From d770668a1402acb1406b48fa50fc34f1baba3d73 Mon Sep 17 00:00:00 2001 From: Ricky Xu Date: Thu, 26 Jan 2023 19:15:13 -0500 Subject: [PATCH 013/267] [ci][core][data] Have tests from data to be owned by data team on flaky dashboard. (#31972) --- python/ray/data/BUILD | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/python/ray/data/BUILD b/python/ray/data/BUILD index 2dd31bbbf138..0217c480ab40 100644 --- a/python/ray/data/BUILD +++ b/python/ray/data/BUILD @@ -23,7 +23,7 @@ py_test( size = "large", srcs = ["tests/test_dataset_formats.py"], data = glob(["tests/image-folder/**/*"]), - tags = ["team:core", "exclusive"], + tags = ["team:data", "exclusive"], deps = ["//:ray_lib", ":conftest"], ) @@ -31,7 +31,7 @@ py_test( name = "test_mongo_dataset", size = "large", srcs = ["tests/test_mongo_dataset.py"], - tags = ["team:core", "exclusive", "dataset_integration"], + tags = ["team:data", "exclusive", "dataset_integration"], deps = ["//:ray_lib", ":conftest"], ) @@ -45,6 +45,6 @@ py_test_module_list( ], ), size = "large", - tags = ["team:core", "exclusive"], + tags = ["team:data", "exclusive"], deps = ["//:ray_lib", ":conftest"], ) From 5b0f7a2ddb8eb5dc761cf81fa16087df9be72c5c Mon Sep 17 00:00:00 2001 From: Ricky Xu Date: Thu, 26 Jan 2023 19:19:28 -0500 Subject: [PATCH 014/267] [core][state] Task backend return most recently added tasks when getting all tasks (#31837) Signed-off-by: rickyyx This PR changes the implicit ordering of task events returned by GcsTaskManager when querying all task events with limit: it will now always returns the most recently added task events. Before this PR, there is no implicit ordering and usually the least recently added task events are returned. This allows users to get recent data when data truncation happens. --- python/ray/tests/test_state_api.py | 4 +- src/ray/gcs/gcs_server/gcs_task_manager.cc | 25 +++++++++++- src/ray/gcs/gcs_server/gcs_task_manager.h | 5 ++- .../gcs_server/test/gcs_task_manager_test.cc | 40 +++++++++++++++++++ 4 files changed, 69 insertions(+), 5 deletions(-) diff --git a/python/ray/tests/test_state_api.py b/python/ray/tests/test_state_api.py index 1be1619a7ecc..3859eb11f43a 100644 --- a/python/ray/tests/test_state_api.py +++ b/python/ray/tests/test_state_api.py @@ -2361,10 +2361,10 @@ def f(): def verify(task_attempts): assert len(task_attempts) == 3 - for task_attempt in task_attempts[:-1]: + for task_attempt in task_attempts[1:]: assert task_attempt["state"] == "FAILED" - task_attempts[-1]["state"] == "FINISHED" + task_attempts[0]["state"] == "FINISHED" assert {task_attempt["attempt_number"] for task_attempt in task_attempts} == { 0, diff --git a/src/ray/gcs/gcs_server/gcs_task_manager.cc b/src/ray/gcs/gcs_server/gcs_task_manager.cc index 68dc813758cc..68f75cd918a3 100644 --- a/src/ray/gcs/gcs_server/gcs_task_manager.cc +++ b/src/ray/gcs/gcs_server/gcs_task_manager.cc @@ -30,7 +30,26 @@ void GcsTaskManager::Stop() { std::vector GcsTaskManager::GcsTaskManagerStorage::GetTaskEvents() const { - return task_events_; + std::vector ret; + // NOTE(rickyx): This could be done better if we expose an iterator - which we + // probably have to do if we are supporting pagination in the future. 
+ // As for now, this will make sure data is returned w.r.t insertion order, so we could + // return the more recent entries when limit applies. + RAY_CHECK(next_idx_to_overwrite_ == 0 || next_idx_to_overwrite_ < task_events_.size()) + << "next_idx_to_overwrite=" << next_idx_to_overwrite_ + << " should be in bound. (size=" << task_events_.size() << ")"; + // Copy from the least recently generated data, where `next_idx_to_overwrite_` points to + // the least recently added data. + std::copy(task_events_.begin() + next_idx_to_overwrite_, + task_events_.end(), + std::back_inserter(ret)); + // Copy the wrapped around if any + if (next_idx_to_overwrite_ > 0) { + std::copy(task_events_.begin(), + task_events_.begin() + next_idx_to_overwrite_, + std::back_inserter(ret)); + } + return ret; } std::vector GcsTaskManager::GcsTaskManagerStorage::GetTaskEvents( @@ -345,7 +364,9 @@ void GcsTaskManager::HandleGetTaskEvents(rpc::GetTaskEventsRequest request, auto count = 0; int32_t num_profile_event_limit = 0; int32_t num_status_event_limit = 0; - for (auto &task_event : task_events) { + + for (auto itr = task_events.rbegin(); itr != task_events.rend(); ++itr) { + auto &task_event = *itr; if (request.exclude_driver_task() && !task_event.has_state_updates()) { // Driver related profile events will generate TaskEvent w/o any task state updates. continue; diff --git a/src/ray/gcs/gcs_server/gcs_task_manager.h b/src/ray/gcs/gcs_server/gcs_task_manager.h index afd49d9604eb..f8e779ef7c1a 100644 --- a/src/ray/gcs/gcs_server/gcs_task_manager.h +++ b/src/ray/gcs/gcs_server/gcs_task_manager.h @@ -137,7 +137,10 @@ class GcsTaskManager : public rpc::TaskInfoHandler { /// Get all task events. /// - /// \return all task events stored. + /// This retrieves copies of all task events ordered from the least recently inserted + /// to the most recently inserted task events. + /// + /// \return all task events stored sorted with insertion order. std::vector GetTaskEvents() const; /// Get task events from tasks corresponding to `task_ids`. diff --git a/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc b/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc index d106f25c7c1d..bf192b2ec609 100644 --- a/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc +++ b/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc @@ -732,5 +732,45 @@ TEST_F(GcsTaskManagerMemoryLimitedTest, TestLimitTaskEvents) { } } +TEST_F(GcsTaskManagerMemoryLimitedTest, TestLimitReturnRecentTasksWhenGetAll) { + // Keep adding tasks and make sure even with eviction, the returned tasks are + // the mo + size_t num_to_insert = 200; + size_t num_query = 10; + size_t inserted = 0; + + auto task_ids = GenTaskIDs(num_to_insert); + + for (size_t i = 0; i < num_to_insert; ++i) { + // Add a task event + { + inserted++; + auto events = GenTaskEvents({task_ids[i]}, + /* attempt_number */ 0, + /* job_id */ 0, + /* profile event */ absl::nullopt, + GenStateUpdate({{rpc::TaskStatus::RUNNING, 1}})); + auto events_data = Mocker::GenTaskEventsData(events); + SyncAddTaskEventData(events_data); + } + + if (inserted < num_query || inserted % num_query != 0) { + continue; + } + + // Expect returned tasks with limit are the most recently added ones. 
+ { + absl::flat_hash_set query_ids(task_ids.begin() + (inserted - num_query), + task_ids.begin() + inserted); + auto reply = SyncGetTaskEvents( + /* task_ids */ {}, /* job_id */ absl::nullopt, /* limit */ num_query); + for (const auto &task_event : reply.events_by_task()) { + EXPECT_EQ(query_ids.count(TaskID::FromBinary(task_event.task_id())), 1) + << TaskID::FromBinary(task_event.task_id()).Hex() << "not there, at " << i; + } + } + } +} + } // namespace gcs } // namespace ray From 6bcaa9c55f7ad4ea14366ac7762458d5bf17ffd5 Mon Sep 17 00:00:00 2001 From: Kai Fricke Date: Thu, 26 Jan 2023 17:02:29 -0800 Subject: [PATCH 015/267] [tune] Only keep cached actors if search has not ended (#31974) We currently keep one actor cached if no other trials have been staged to prevent us removing actors when we may need them in one of the next iterations. However, when the search algorithm won't produce new trials anymore, we keep this actor needlessly. This can keep resources occupied needlessly and prevent downscaling, as caught in #31883. This PR passes another flag to the trial executor cleanup method indicating if new trials are to be expected. If not, we can cleanup unneeded actors even if no further trials are staged. This behavior is tested in the `cluster_tune_scale_up_down` release test. We won't add a unit test for this as this would effectively mimic the release test. Instead, we can add proper actor reuse testing once we made more progress with the execution refactor. Signed-off-by: Kai Fricke --- .../ray/tune/execution/ray_trial_executor.py | 14 +++++++---- python/ray/tune/execution/trial_runner.py | 2 +- python/ray/tune/tests/test_trial_runner_3.py | 2 +- .../workloads/tune_scale_up_down.py | 24 +++++++++++++++++++ 4 files changed, 35 insertions(+), 7 deletions(-) diff --git a/python/ray/tune/execution/ray_trial_executor.py b/python/ray/tune/execution/ray_trial_executor.py index a3e8f3f56af8..035bb55defd2 100644 --- a/python/ray/tune/execution/ray_trial_executor.py +++ b/python/ray/tune/execution/ray_trial_executor.py @@ -843,8 +843,8 @@ def on_step_begin(self) -> None: """Before step() is called, update the available resources.""" self._resource_updater.update_avail_resources() - def on_step_end(self) -> None: - self._cleanup_cached_actors() + def on_step_end(self, search_ended: bool = False) -> None: + self._cleanup_cached_actors(search_ended=search_ended) self._do_force_trial_cleanup() def _count_staged_resources(self): @@ -854,7 +854,9 @@ def _count_staged_resources(self): counter[resource_request] += 1 return counter - def _cleanup_cached_actors(self, force_all: bool = False): + def _cleanup_cached_actors( + self, search_ended: bool = False, force_all: bool = False + ): """Clean up unneeded cached actors. Ray Tune caches actors for re-use to avoid initialization overhead. This is @@ -884,8 +886,10 @@ def _cleanup_cached_actors(self, force_all: bool = False): resources for all cached actors. If we cached more actors than we need, we terminate the excess actors and free the resources. """ - if not self._staged_trials and not force_all: - # If we don't have any staged trials, keep cached actors + if not self._staged_trials and not force_all and not search_ended: + # If we don't have any staged trials, keep cached actors, + # unless cleanup is forced or no new trials are going to be generated + # (if the search ended). 
return staged_resources = self._count_staged_resources() diff --git a/python/ray/tune/execution/trial_runner.py b/python/ray/tune/execution/trial_runner.py index 0479dd6eeb4d..f25e63828220 100644 --- a/python/ray/tune/execution/trial_runner.py +++ b/python/ray/tune/execution/trial_runner.py @@ -967,7 +967,7 @@ def step(self): self._reconcile_live_trials() with warn_if_slow("on_step_end"): - self.trial_executor.on_step_end() + self.trial_executor.on_step_end(search_ended=self._search_alg.is_finished()) with warn_if_slow("callbacks.on_step_end"): self._callbacks.on_step_end(iteration=self._iteration, trials=self._trials) diff --git a/python/ray/tune/tests/test_trial_runner_3.py b/python/ray/tune/tests/test_trial_runner_3.py index a50b714553de..79c130377f42 100644 --- a/python/ray/tune/tests/test_trial_runner_3.py +++ b/python/ray/tune/tests/test_trial_runner_3.py @@ -75,7 +75,7 @@ def on_step_begin(self): cnt = self.pre_step if hasattr(self, "pre_step") else 0 self.pre_step = cnt + 1 - def on_step_end(self): + def on_step_end(self, search_ended: bool = False): cnt = self.pre_step if hasattr(self, "post_step") else 0 self.post_step = 1 + cnt diff --git a/release/cluster_tests/workloads/tune_scale_up_down.py b/release/cluster_tests/workloads/tune_scale_up_down.py index f99ebcfc496d..7909ce8aa0c7 100644 --- a/release/cluster_tests/workloads/tune_scale_up_down.py +++ b/release/cluster_tests/workloads/tune_scale_up_down.py @@ -1,3 +1,27 @@ +"""Test cluster up/down scaling behavior. + +This test should run on a cluster with autoscaling enabled. It assumes 1-3 nodes +with 4 CPUs each. + +We start a Ray Tune run with 3 trials. Each trial uses 4 CPUs, so fills up a node +completely. This means we will trigger autoscaling after starting up. + +The trial on the head node will run for 30 minutes. This is to make sure that +we have enough time that the nodes for the other two trials come up, complete +training, and come down before the first trial finishes. + +The other two trials will run once their nodes are up, and take 3 minutes each +to finish. The three minutes have been chosen to make sure that both trials +run in parallel for some time, i.e. to avoid that both additional trials run on +only one node. + +We keep track of the number of nodes we observe at any point during the run. + +Test owner: krfricke + +Acceptance criteria: Should have scaled to 3 nodes at some point during the run. +Should have scaled down to 1 node at the end. +""" from collections import Counter import time From 581cd4e21e74f7e7b85386fbd1e80d40c3251623 Mon Sep 17 00:00:00 2001 From: Yi Cheng <74173148+iycheng@users.noreply.github.com> Date: Thu, 26 Jan 2023 20:03:13 -0800 Subject: [PATCH 016/267] [nightly] Update the many nodes actor workload to 1k nodes. (#31935) This PR update the test to run with 1k nodes 20k actors. Right now the infra can't scale to 1k nodes when starting because of rate limiting. This PR scale up inside the testing script slowly to avoid the rate limiting. 
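The incremental scale-up pattern is roughly the following (a simplified sketch of the `scale_cluster_up` helper added in this PR; the step size and poll interval are illustrative, and it assumes a cluster with autoscaling enabled and `ray.init(address="auto")` already called):

```python
# Sketch: request cluster CPUs in increments instead of one large request,
# so provisioning is not throttled by the provider's rate limiting.
from time import sleep
import ray
from ray.autoscaler.sdk import request_resources

def scale_cluster_up(target_cpus: int, step: int = 1000) -> None:
    def current_cpus() -> int:
        return int(sum(n.get("Resources", {}).get("CPU", 0) for n in ray.nodes()))

    while current_cpus() < target_cpus:
        next_target = min(current_cpus() + step, target_cpus)
        request_resources(num_cpus=next_target)
        sleep(10)  # illustrative wait while new nodes come up
```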
--- .../many_nodes_tests/actor_test.py | 125 ++++++++++++++++++ .../many_nodes_tests/app_config.yaml | 0 .../many_nodes_tests/compute_config.yaml | 6 +- .../many_nodes_tests/multi_master_test.py | 0 .../many_nodes_tests/actor_test.py | 73 ---------- release/release_tests.yaml | 19 +-- 6 files changed, 138 insertions(+), 85 deletions(-) create mode 100644 release/benchmarks/distributed/many_nodes_tests/actor_test.py rename release/{nightly_tests => benchmarks/distributed}/many_nodes_tests/app_config.yaml (100%) rename release/{nightly_tests => benchmarks/distributed}/many_nodes_tests/compute_config.yaml (71%) rename release/{nightly_tests => benchmarks/distributed}/many_nodes_tests/multi_master_test.py (100%) delete mode 100644 release/nightly_tests/many_nodes_tests/actor_test.py diff --git a/release/benchmarks/distributed/many_nodes_tests/actor_test.py b/release/benchmarks/distributed/many_nodes_tests/actor_test.py new file mode 100644 index 000000000000..495570a74c6d --- /dev/null +++ b/release/benchmarks/distributed/many_nodes_tests/actor_test.py @@ -0,0 +1,125 @@ +import argparse +import os +import math +from time import sleep, perf_counter +import json +import ray +import psutil + + +def test_max_actors_launch(cpus_per_actor, total_actors): + @ray.remote(num_cpus=cpus_per_actor) + class Actor: + def foo(self): + pass + + print("Start launch actors") + actors = [Actor.options(max_restarts=-1).remote() for _ in range(total_actors)] + return actors + + +def parse_script_args(): + parser = argparse.ArgumentParser() + parser.add_argument("--cpus-per-actor", type=float, default=0.2) + parser.add_argument("--total-actors", nargs="+", type=int, required=True) + parser.add_argument("--no-report", default=False, action="store_true") + parser.add_argument("--no-wait", default=False, action="store_true") + return parser.parse_known_args() + + +def scale_cluster_up(num_cpus): + print(f"Start to scale up to {num_cpus} cpus") + + def get_curr_cpus(): + return int(sum([r.get("Resources", {}).get("CPU", 0) for r in ray.nodes()])) + + step = 1000 + curr_cpus = get_curr_cpus() + target_cpus = curr_cpus + + while curr_cpus < num_cpus: + curr_cpus = get_curr_cpus() + new_target_cpus = min(curr_cpus + step, num_cpus) + if new_target_cpus != target_cpus: + target_cpus = new_target_cpus + ray.autoscaler.sdk.request_resources(num_cpus=target_cpus) + print(f"Waiting for cluster to be up: {curr_cpus}->{target_cpus}->{num_cpus}") + sleep(10) + + +def run_one(total_actors, cpus_per_actor, no_wait): + total_cpus = cpus_per_actor * total_actors + psutil.cpu_count() + total_cpus = int(math.ceil(total_cpus)) + scale_cluster_up(total_cpus) + + actor_launch_start = perf_counter() + actors = test_max_actors_launch(cpus_per_actor, total_actors) + actor_launch_end = perf_counter() + actor_launch_time = actor_launch_end - actor_launch_start + actor_ready_start = perf_counter() + total_actors = len(actors) + objs = [actor.foo.remote() for actor in actors] + + while len(objs) != 0: + timeout = None if no_wait else 30 + objs_ready, objs = ray.wait(objs, num_returns=len(objs), timeout=timeout) + print( + f"Status: {total_actors - len(objs)}/{total_actors}, " + f"{perf_counter() - actor_ready_start}" + ) + actor_ready_end = perf_counter() + actor_ready_time = actor_ready_end - actor_ready_start + + throughput = total_actors / (actor_ready_time + actor_launch_time) + print(f"Actor launch time: {actor_launch_time} ({total_actors} actors)") + print(f"Actor ready time: {actor_ready_time} ({total_actors} actors)") + print( + f"Total 
time: {actor_launch_time + actor_ready_time}" + f" ({total_actors} actors)" + ) + print(f"Through put: {throughput}") + + return { + "actor_launch_time": actor_launch_time, + "actor_ready_time": actor_ready_time, + "total_time": actor_launch_time + actor_ready_time, + "num_actors": total_actors, + "success": "1", + "throughput": throughput, + } + + +def main(): + args, unknown = parse_script_args() + args.total_actors.sort() + + ray.init(address="auto") + + dashboard_test = None + # Enable it once v2 support prometheus + # dashboard_test = DashboardTestAtScale(addr) + result = {} + for i in args.total_actors: + result[f"many_nodes_actor_tests_{i}"] = run_one( + i, args.cpus_per_actor, args.no_wait + ) + + if "TEST_OUTPUT_JSON" in os.environ and not args.no_report: + out_file = open(os.environ["TEST_OUTPUT_JSON"], "w") + if dashboard_test is not None: + perf = [ + { + "perf_metric_name": name, + "perf_metric_value": r["throughput"], + "perf_metric_type": "THROUGHPUT", + } + for (name, r) in result.items() + ] + result["perf_metrics"] = perf + dashboard_test.update_release_test_result(result) + + json.dump(result, out_file) + + +if __name__ == "__main__": + main() diff --git a/release/nightly_tests/many_nodes_tests/app_config.yaml b/release/benchmarks/distributed/many_nodes_tests/app_config.yaml similarity index 100% rename from release/nightly_tests/many_nodes_tests/app_config.yaml rename to release/benchmarks/distributed/many_nodes_tests/app_config.yaml diff --git a/release/nightly_tests/many_nodes_tests/compute_config.yaml b/release/benchmarks/distributed/many_nodes_tests/compute_config.yaml similarity index 71% rename from release/nightly_tests/many_nodes_tests/compute_config.yaml rename to release/benchmarks/distributed/many_nodes_tests/compute_config.yaml index 8a0e63ebb518..882fca85b154 100644 --- a/release/nightly_tests/many_nodes_tests/compute_config.yaml +++ b/release/benchmarks/distributed/many_nodes_tests/compute_config.yaml @@ -8,7 +8,7 @@ head_node_type: worker_node_types: - name: worker_node - instance_type: m5.xlarge - min_workers: 250 - max_workers: 250 + instance_type: m5.large + min_workers: 500 + max_workers: 2000 use_spot: false diff --git a/release/nightly_tests/many_nodes_tests/multi_master_test.py b/release/benchmarks/distributed/many_nodes_tests/multi_master_test.py similarity index 100% rename from release/nightly_tests/many_nodes_tests/multi_master_test.py rename to release/benchmarks/distributed/many_nodes_tests/multi_master_test.py diff --git a/release/nightly_tests/many_nodes_tests/actor_test.py b/release/nightly_tests/many_nodes_tests/actor_test.py deleted file mode 100644 index 884647d1c0f3..000000000000 --- a/release/nightly_tests/many_nodes_tests/actor_test.py +++ /dev/null @@ -1,73 +0,0 @@ -import argparse -import os -from time import sleep, perf_counter -import json -import ray - - -def test_max_actors_launch(cpus_per_actor, total_actors): - @ray.remote(num_cpus=cpus_per_actor) - class Actor: - def foo(self): - pass - - print("Start launch actors") - actors = [Actor.options(max_restarts=-1).remote() for _ in range(total_actors)] - return actors - - -def parse_script_args(): - parser = argparse.ArgumentParser() - parser.add_argument("--cpus-per-actor", type=float, default=0.2) - parser.add_argument("--total-actors", type=int, default=5000) - parser.add_argument("--no-report", default=False, action="store_true") - parser.add_argument("--fail", default=False, action="store_true") - return parser.parse_known_args() - - -def main(): - args, unknown = 
parse_script_args() - - ray.init(address="auto") - actor_launch_start = perf_counter() - actors = test_max_actors_launch(args.cpus_per_actor, args.total_actors) - actor_launch_end = perf_counter() - actor_launch_time = actor_launch_end - actor_launch_start - - if args.fail: - sleep(10) - return - actor_ready_start = perf_counter() - total_actors = len(actors) - objs = [actor.foo.remote() for actor in actors] - - while len(objs) != 0: - objs_ready, objs = ray.wait(objs, timeout=10) - print( - f"Status: {total_actors - len(objs)}/{total_actors}, " - f"{perf_counter() - actor_ready_start}" - ) - actor_ready_end = perf_counter() - actor_ready_time = actor_ready_end - actor_ready_start - - print(f"Actor launch time: {actor_launch_time} ({args.total_actors} actors)") - print(f"Actor ready time: {actor_ready_time} ({args.total_actors} actors)") - print( - f"Total time: {actor_launch_time + actor_ready_time}" - f" ({args.total_actors} actors)" - ) - - if "TEST_OUTPUT_JSON" in os.environ and not args.no_report: - out_file = open(os.environ["TEST_OUTPUT_JSON"], "w") - results = { - "actor_launch_time": actor_launch_time, - "actor_ready_time": actor_ready_time, - "total_time": actor_launch_time + actor_ready_time, - "num_actors": args.total_actors, - "success": "1", - } - json.dump(results, out_file) - - -if __name__ == "__main__": - main() diff --git a/release/release_tests.yaml b/release/release_tests.yaml index bb830a6db379..1c6e51a078dc 100644 --- a/release/release_tests.yaml +++ b/release/release_tests.yaml @@ -3872,27 +3872,28 @@ num_nodes: 32 -- name: many_nodes_actor_test +- name: many_nodes_actor_test_on_v2 group: core-daily-test - working_dir: nightly_tests + working_dir: benchmarks legacy: test_name: many_nodes_actor_test - test_suite: nightly_tests + test_suite: benchmarks frequency: nightly-3x team: core env: staging cluster: - cluster_env: many_nodes_tests/app_config.yaml - cluster_compute: many_nodes_tests/compute_config.yaml + cluster_env: distributed/many_nodes_tests/app_config.yaml + cluster_compute: distributed/many_nodes_tests/compute_config.yaml run: timeout: 7200 - # 4cpus per node x 250 nodes / 0.2 cpus per actor = 5k - script: python many_nodes_tests/actor_test.py --cpus-per-actor=0.2 --total-actors=5000 - wait_for_nodes: - num_nodes: 251 + # 2cpus per node x 1000 nodes / 0.2 cpus per actor = 10k + # 2cpus per node x 2000 nodes / 0.2 cpus per actor = 20k + script: python distributed/many_nodes_tests/actor_test.py --no-wait --cpus-per-actor=0.2 --total-actors 1000 2000 type: job + wait_for_nodes: + num_nodes: 500 #- name: many_nodes_multi_master_test # group: core-daily-test From b60f887597f1d5cd29039bd6fe584dfb986ca177 Mon Sep 17 00:00:00 2001 From: Yi Cheng <74173148+iycheng@users.noreply.github.com> Date: Thu, 26 Jan 2023 22:06:04 -0800 Subject: [PATCH 017/267] [nightly] Increase the number of actors started for the test (#31990) Signed-off-by: Yi Cheng <74173148+iycheng@users.noreply.github.com> In the previously PR, the number failed to be updated. This PR updated it. 
``` many_nodes_actor_tests_10000 = {'actor_launch_time': 14.038594387999979, 'actor_ready_time': 44.27844531799997, 'total_time': 58.317039705999946, 'num_actors': 10000, 'success': '1', 'throughput': 17 1.47646812002273} many_nodes_actor_tests_20000 = {'actor_launch_time': 17.670945039000117, 'actor_ready_time': 230.851894916, 'total_time': 248.5228399550001, 'num_actors': 20000, 'success': '1', 'throughput': 80.4755 0077739892} ``` --- release/release_tests.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/release/release_tests.yaml b/release/release_tests.yaml index 1c6e51a078dc..e1db50e84d51 100644 --- a/release/release_tests.yaml +++ b/release/release_tests.yaml @@ -3890,7 +3890,7 @@ timeout: 7200 # 2cpus per node x 1000 nodes / 0.2 cpus per actor = 10k # 2cpus per node x 2000 nodes / 0.2 cpus per actor = 20k - script: python distributed/many_nodes_tests/actor_test.py --no-wait --cpus-per-actor=0.2 --total-actors 1000 2000 + script: python distributed/many_nodes_tests/actor_test.py --no-wait --cpus-per-actor=0.2 --total-actors 10000 20000 type: job wait_for_nodes: num_nodes: 500 From 3343c76332ce0db9d0f8c98d6ac153804e4afe18 Mon Sep 17 00:00:00 2001 From: Peyton Murray Date: Thu, 26 Jan 2023 23:18:49 -0800 Subject: [PATCH 018/267] Add informative progress bar names to map_batches (#31526) Signed-off-by: pdmurray Signed-off-by: pdmurray --- .bazeliskrc | 1 + .gitignore | 2 + python/ray/air/tests/test_dataset_config.py | 6 +- python/ray/data/_internal/plan.py | 26 +++++++- python/ray/data/dataset.py | 10 ++- python/ray/data/tests/test_dataset.py | 10 +-- python/ray/data/tests/test_optimize.py | 64 +++++++++++-------- python/ray/data/tests/test_stats.py | 45 +++++++------ .../ray/train/tests/test_batch_predictor.py | 16 ++--- 9 files changed, 115 insertions(+), 65 deletions(-) create mode 100644 .bazeliskrc diff --git a/.bazeliskrc b/.bazeliskrc new file mode 100644 index 000000000000..9adf2699b0d0 --- /dev/null +++ b/.bazeliskrc @@ -0,0 +1 @@ +USE_BAZEL_VERSION=5.x diff --git a/.gitignore b/.gitignore index 297a7b9d0608..9268fa948c4e 100644 --- a/.gitignore +++ b/.gitignore @@ -224,3 +224,5 @@ workflow_data/ # Auto-generated tag mapping tag-mapping.json + +.bazeliskrc diff --git a/python/ray/air/tests/test_dataset_config.py b/python/ray/air/tests/test_dataset_config.py index 6616395f93bd..902835e3f4b9 100644 --- a/python/ray/air/tests/test_dataset_config.py +++ b/python/ray/air/tests/test_dataset_config.py @@ -251,7 +251,7 @@ def checker(shard, results): # applying the preprocessor on each epoch. 
assert results[0] == results[1], results stats = shard.stats() - assert "Stage 1 read->map_batches: 1/1 blocks executed " in stats, stats + assert "Stage 1 read->BatchMapper: 1/1 blocks executed " in stats, stats def rand(x): x["value"] = [random.random() for _ in range(len(x))] @@ -284,8 +284,8 @@ def checker(shard, results): assert results[0] != results[1], results stats = shard.stats() assert ( - "Stage 1 read->randomize_block_order->map_batches: 1/1 blocks executed " - in stats + "Stage 1 read->randomize_block_order->" + "BatchMapper: 1/1 blocks executed " in stats ), stats test = TestStream( diff --git a/python/ray/data/_internal/plan.py b/python/ray/data/_internal/plan.py index 3bc492e944e9..47097bf2821b 100644 --- a/python/ray/data/_internal/plan.py +++ b/python/ray/data/_internal/plan.py @@ -45,6 +45,30 @@ logger = DatasetLogger(__name__) +def capfirst(s: str): + """Capitalize the first letter of a string + + Args: + s: String to capitalize + + Returns: + Capitalized string + """ + return s[0].upper() + s[1:] + + +def capitalize(s: str): + """Capitalize a string, removing '_' and keeping camelcase. + + Args: + s: String to capitalize + + Returns: + Capitalized string with no underscores. + """ + return "".join(capfirst(x) for x in s.split("_")) + + class Stage: """Represents a Dataset transform stage (e.g., map or shuffle).""" @@ -157,7 +181,7 @@ def get_plan_as_string(self) -> str: # Get string representation of each stage in reverse order. for stage in self._stages_after_snapshot[::-1]: # Get name of each stage in camel case. - stage_name = stage.name.title().replace("_", "") + stage_name = capitalize(stage.name) if num_stages == 0: plan_str += f"{stage_name}\n" else: diff --git a/python/ray/data/dataset.py b/python/ray/data/dataset.py index 7ab51669992b..f2f9db25753d 100644 --- a/python/ray/data/dataset.py +++ b/python/ray/data/dataset.py @@ -671,8 +671,16 @@ def process_next_batch(batch: DataBatch) -> Iterator[Block]: if output_buffer.has_next(): yield output_buffer.next() + # breakpoint() + if hasattr(fn, "__self__") and isinstance( + fn.__self__, ray.data.preprocessor.Preprocessor + ): + stage_name = fn.__self__.__class__.__name__ + else: + stage_name = f'MapBatches({getattr(fn, "__name__", type(fn))})' + stage = OneToOneStage( - "map_batches", + stage_name, transform, compute, ray_remote_args, diff --git a/python/ray/data/tests/test_dataset.py b/python/ray/data/tests/test_dataset.py index e593c5ca60ce..4cd1d39aa5a8 100644 --- a/python/ray/data/tests/test_dataset.py +++ b/python/ray/data/tests/test_dataset.py @@ -1517,26 +1517,28 @@ def test_dataset_repr(ray_start_regular_shared): assert repr(ds) == "Dataset(num_blocks=10, num_rows=10, schema=)" ds = ds.map_batches(lambda x: x) assert repr(ds) == ( - "MapBatches\n" "+- Dataset(num_blocks=10, num_rows=10, schema=)" + "MapBatches()\n" + "+- Dataset(num_blocks=10, num_rows=10, schema=)" ) ds = ds.filter(lambda x: x > 0) assert repr(ds) == ( "Filter\n" - "+- MapBatches\n" + "+- MapBatches()\n" " +- Dataset(num_blocks=10, num_rows=10, schema=)" ) ds = ds.random_shuffle() assert repr(ds) == ( "RandomShuffle\n" "+- Filter\n" - " +- MapBatches\n" + " +- MapBatches()\n" " +- Dataset(num_blocks=10, num_rows=10, schema=)" ) ds.fully_executed() assert repr(ds) == "Dataset(num_blocks=10, num_rows=9, schema=)" ds = ds.map_batches(lambda x: x) assert repr(ds) == ( - "MapBatches\n" "+- Dataset(num_blocks=10, num_rows=9, schema=)" + "MapBatches()\n" + "+- Dataset(num_blocks=10, num_rows=9, schema=)" ) ds1, ds2 = ds.split(2) assert ( diff 
--git a/python/ray/data/tests/test_optimize.py b/python/ray/data/tests/test_optimize.py index e8d0893aa3a4..97b62885e1b2 100644 --- a/python/ray/data/tests/test_optimize.py +++ b/python/ray/data/tests/test_optimize.py @@ -59,6 +59,11 @@ def expect_stages(pipe, num_stages_expected, stage_names): ), pipe._optimized_stages +def dummy_map(x): + """Dummy function used in calls to map_batches in these tests.""" + return x + + def test_memory_sanity(shutdown_only): info = ray.init(num_cpus=1, object_store_memory=500e6) ds = ray.data.range(10) @@ -312,23 +317,23 @@ def test_optimize_reorder(ray_start_regular_shared): context.optimize_fuse_read_stages = True context.optimize_reorder_stages = True - ds = ray.data.range(10).randomize_block_order().map_batches(lambda x: x) + ds = ray.data.range(10).randomize_block_order().map_batches(dummy_map) expect_stages( ds, 2, - ["read->map_batches", "randomize_block_order"], + ["read->MapBatches(dummy_map)", "randomize_block_order"], ) ds2 = ( ray.data.range(10) .randomize_block_order() .repartition(10) - .map_batches(lambda x: x) + .map_batches(dummy_map) ) expect_stages( ds2, 3, - ["read->randomize_block_order", "repartition", "map_batches"], + ["read->randomize_block_order", "repartition", "MapBatches(dummy_map)"], ) @@ -338,10 +343,10 @@ def test_window_randomize_fusion(ray_start_regular_shared): context.optimize_fuse_read_stages = True context.optimize_reorder_stages = True - pipe = ray.data.range(100).randomize_block_order().window().map_batches(lambda x: x) + pipe = ray.data.range(100).randomize_block_order().window().map_batches(dummy_map) pipe.take() stats = pipe.stats() - assert "read->randomize_block_order->map_batches" in stats, stats + assert "read->randomize_block_order->MapBatches(dummy_map)" in stats, stats def test_optimize_fuse(ray_start_regular_shared): @@ -349,8 +354,8 @@ def test_optimize_fuse(ray_start_regular_shared): def build_pipe(): pipe = ray.data.range(3).window(blocks_per_window=1).repeat(2) - pipe = pipe.map_batches(lambda x: x) - pipe = pipe.map_batches(lambda x: x) + pipe = pipe.map_batches(dummy_map) + pipe = pipe.map_batches(dummy_map) pipe = pipe.random_shuffle_each_window() results = [sorted(p.take()) for p in pipe.iter_epochs()] assert results == [[0, 1, 2], [0, 1, 2]], results @@ -362,7 +367,10 @@ def build_pipe(): expect_stages( build_pipe(), 1, - ["read->map_batches->map_batches->random_shuffle_map", "random_shuffle_reduce"], + [ + "read->MapBatches(dummy_map)->MapBatches(dummy_map)->random_shuffle_map", + "random_shuffle_reduce", + ], ) context.optimize_fuse_stages = True @@ -373,7 +381,7 @@ def build_pipe(): 1, [ "read", - "map_batches->map_batches->random_shuffle_map", + "MapBatches(dummy_map)->MapBatches(dummy_map)->random_shuffle_map", "random_shuffle_reduce", ], ) @@ -386,7 +394,7 @@ def build_pipe(): 2, [ "read", - "map_batches->map_batches", + "MapBatches(dummy_map)->MapBatches(dummy_map)", "random_shuffle_map", "random_shuffle_reduce", ], @@ -400,8 +408,8 @@ def build_pipe(): 3, [ "read", - "map_batches", - "map_batches", + "MapBatches(dummy_map)", + "MapBatches(dummy_map)", "random_shuffle_map", "random_shuffle_reduce", ], @@ -428,14 +436,14 @@ def test_optimize_equivalent_remote_args(ray_start_regular_shared): for kwb in equivalent_kwargs: print("CHECKING", kwa, kwb) pipe = ray.data.range(3).repeat(2) - pipe = pipe.map_batches(lambda x: x, compute="tasks", **kwa) - pipe = pipe.map_batches(lambda x: x, compute="tasks", **kwb) + pipe = pipe.map_batches(dummy_map, compute="tasks", **kwa) + pipe = 
pipe.map_batches(dummy_map, compute="tasks", **kwb) pipe.take() expect_stages( pipe, 1, [ - "read->map_batches->map_batches", + "read->MapBatches(dummy_map)->MapBatches(dummy_map)", ], ) @@ -443,14 +451,14 @@ def test_optimize_equivalent_remote_args(ray_start_regular_shared): for kwb in equivalent_kwargs: print("CHECKING", kwa, kwb) pipe = ray.data.range(3).repeat(2) - pipe = pipe.map_batches(lambda x: x, compute="tasks", **kwa) + pipe = pipe.map_batches(dummy_map, compute="tasks", **kwa) pipe = pipe.random_shuffle_each_window(**kwb) pipe.take() expect_stages( pipe, 1, [ - "read->map_batches->random_shuffle_map", + "read->MapBatches(dummy_map)->random_shuffle_map", "random_shuffle_reduce", ], ) @@ -464,32 +472,32 @@ def test_optimize_incompatible_stages(ray_start_regular_shared): pipe = ray.data.range(3).repeat(2) # Should get fused as long as their resource types are compatible. - pipe = pipe.map_batches(lambda x: x, compute="actors") + pipe = pipe.map_batches(dummy_map, compute="actors") # Cannot fuse actors->tasks. - pipe = pipe.map_batches(lambda x: x, compute="tasks") + pipe = pipe.map_batches(dummy_map, compute="tasks") pipe = pipe.random_shuffle_each_window() pipe.take() expect_stages( pipe, 2, [ - "read->map_batches", - "map_batches->random_shuffle_map", + "read->MapBatches(dummy_map)", + "MapBatches(dummy_map)->random_shuffle_map", "random_shuffle_reduce", ], ) pipe = ray.data.range(3).repeat(2) - pipe = pipe.map_batches(lambda x: x, compute="tasks") - pipe = pipe.map_batches(lambda x: x, num_cpus=0.75) + pipe = pipe.map_batches(dummy_map, compute="tasks") + pipe = pipe.map_batches(dummy_map, num_cpus=0.75) pipe = pipe.random_shuffle_each_window() pipe.take() expect_stages( pipe, 3, [ - "read->map_batches", - "map_batches", + "read->MapBatches(dummy_map)", + "MapBatches(dummy_map)", "random_shuffle_map", "random_shuffle_reduce", ], @@ -556,7 +564,7 @@ def __call__(self, x): pipe, 1, [ - "read->map_batches->map_batches", + "read->MapBatches(CallableFn)->MapBatches(CallableFn)", ], ) @@ -592,7 +600,7 @@ def __call__(self, x): pipe, 1, [ - "read->map_batches->map_batches", + "read->MapBatches()->MapBatches(CallableFn)", ], ) diff --git a/python/ray/data/tests/test_stats.py b/python/ray/data/tests/test_stats.py index c5c85c27ddda..454750723cfd 100644 --- a/python/ray/data/tests/test_stats.py +++ b/python/ray/data/tests/test_stats.py @@ -25,6 +25,11 @@ def canonicalize(stats: str) -> str: return s4 +def dummy_map_batches(x): + """Dummy function used in calls to map_batches below.""" + return x + + def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): context = DatasetContext.get_current() context.optimize_fuse_stages = True @@ -39,7 +44,7 @@ def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): ) with patch.object(logger, "info") as mock_logger: ds = ray.data.range(1000, parallelism=10) - ds = ds.map_batches(lambda x: x).fully_executed() + ds = ds.map_batches(dummy_map_batches).fully_executed() if enable_auto_log_stats: logger_args, logger_kwargs = mock_logger.call_args @@ -47,7 +52,7 @@ def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): if context.new_execution_backend: assert ( canonicalize(logger_args[0]) - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -61,7 +66,7 
@@ def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): else: assert ( canonicalize(logger_args[0]) - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -71,7 +76,7 @@ def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): """ ) - ds = ds.map(lambda x: x).fully_executed() + ds = ds.map(dummy_map_batches).fully_executed() if enable_auto_log_stats: logger_args, logger_kwargs = mock_logger.call_args @@ -108,7 +113,7 @@ def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): if context.new_execution_backend: assert ( stats - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -140,7 +145,7 @@ def test_dataset_stats_basic(ray_start_regular_shared, enable_auto_log_stats): else: assert ( stats - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -369,7 +374,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ with patch.object(logger, "info") as mock_logger: ds = ray.data.range(1000, parallelism=10) - ds = ds.map_batches(lambda x: x).fully_executed() + ds = ds.map_batches(dummy_map_batches).fully_executed() if enable_auto_log_stats: logger_args, logger_kwargs = mock_logger.call_args @@ -377,7 +382,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ if context.new_execution_backend: assert ( canonicalize(logger_args[0]) - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -391,7 +396,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ else: assert ( canonicalize(logger_args[0]) - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -402,14 +407,14 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ ) pipe = ds.repeat(5) - pipe = pipe.map(lambda x: x) + pipe = pipe.map(dummy_map_batches) if enable_auto_log_stats: # Stats only include first stage, and not for pipelined map logger_args, logger_kwargs = mock_logger.call_args if context.new_execution_backend: assert ( canonicalize(logger_args[0]) - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -423,7 +428,7 @@ def 
test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ else: assert ( canonicalize(logger_args[0]) - == """Stage N read->map_batches: N/N blocks executed in T + == """Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -473,7 +478,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ assert ( stats == """== Pipeline Window N == -Stage N read->map_batches: N/N blocks executed in T +Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -494,7 +499,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ 'obj_store_mem_peak': N} == Pipeline Window N == -Stage N read->map_batches: [execution cached] +Stage N read->MapBatches(dummy_map_batches): [execution cached] * Extra metrics: {'obj_store_mem_alloc': N, 'obj_store_mem_freed': N, \ 'obj_store_mem_peak': N} @@ -509,7 +514,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ 'obj_store_mem_peak': N} == Pipeline Window N == -Stage N read->map_batches: [execution cached] +Stage N read->MapBatches(dummy_map_batches): [execution cached] * Extra metrics: {'obj_store_mem_alloc': N, 'obj_store_mem_freed': N, \ 'obj_store_mem_peak': N} @@ -540,7 +545,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ assert ( stats == """== Pipeline Window N == -Stage N read->map_batches: N/N blocks executed in T +Stage N read->MapBatches(dummy_map_batches): N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total * Remote cpu time: T min, T max, T mean, T total * Peak heap memory usage (MiB): N min, N max, N mean @@ -557,7 +562,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ * Tasks per node: N min, N max, N mean; N nodes used == Pipeline Window N == -Stage N read->map_batches: [execution cached] +Stage N read->MapBatches(dummy_map_batches): [execution cached] Stage N map: N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total @@ -568,7 +573,7 @@ def test_dataset_pipeline_stats_basic(ray_start_regular_shared, enable_auto_log_ * Tasks per node: N min, N max, N mean; N nodes used == Pipeline Window N == -Stage N read->map_batches: [execution cached] +Stage N read->MapBatches(dummy_map_batches): [execution cached] Stage N map: N/N blocks executed in T * Remote wall time: T min, T max, T mean, T total @@ -607,11 +612,11 @@ def test_dataset_pipeline_cache_cases(ray_start_regular_shared): assert "[execution cached]" in stats # CACHED (eager map stage). 
- ds = ray.data.range(10).map_batches(lambda x: x).repeat(2) + ds = ray.data.range(10).map_batches(dummy_map_batches).repeat(2) ds.take(999) stats = ds.stats() assert "[execution cached]" in stats - assert "read->map_batches" in stats + assert "read->MapBatches(dummy_map_batches)" in stats def test_dataset_pipeline_split_stats_basic(ray_start_regular_shared): diff --git a/python/ray/train/tests/test_batch_predictor.py b/python/ray/train/tests/test_batch_predictor.py index 5b04009318ed..5c51a502408e 100644 --- a/python/ray/train/tests/test_batch_predictor.py +++ b/python/ray/train/tests/test_batch_predictor.py @@ -116,8 +116,8 @@ def test_separate_gpu_stage(shutdown_only): allow_gpu=True, ) stats = ds.stats() - assert "Stage 1 read->map_batches:" in stats, stats - assert "Stage 2 map_batches:" in stats, stats + assert "Stage 1 read->DummyPreprocessor:" in stats, stats + assert "Stage 2 MapBatches(ScoringWrapper):" in stats, stats assert ds.max("value") == 36.0, ds ds = batch_predictor.predict( @@ -128,7 +128,7 @@ def test_separate_gpu_stage(shutdown_only): ) stats = ds.stats() assert "Stage 1 read:" in stats, stats - assert "Stage 2 map_batches:" in stats, stats + assert "Stage 2 MapBatches(ScoringWrapper):" in stats, stats assert ds.max("value") == 36.0, ds @@ -160,7 +160,7 @@ def test_batch_prediction(): test_dataset = ray.data.range_table(4) ds = batch_predictor.predict(test_dataset) # Check fusion occurred. - assert "read->map_batches" in ds.stats(), ds.stats() + assert "read->DummyPreprocessor" in ds.stats(), ds.stats() assert ds.to_pandas().to_numpy().squeeze().tolist() == [ 0.0, 4.0, @@ -278,7 +278,7 @@ def test_batch_prediction_various_combination(): ds = batch_predictor.predict(input_dataset) print(ds.stats()) # Check no fusion needed since we're not doing a dataset read. - assert "Stage 1 map_batches" in ds.stats(), ds.stats() + assert f"Stage 1 {preprocessor.__class__.__name__}" in ds.stats(), ds.stats() assert ds.to_pandas().to_numpy().squeeze().tolist() == [ 4.0, 8.0, @@ -544,8 +544,8 @@ def test_separate_gpu_stage_pipelined(shutdown_only): ) out = [x["value"] for x in ds.iter_rows()] stats = ds.stats() - assert "Stage 1 read->map_batches:" in stats, stats - assert "Stage 2 map_batches:" in stats, stats + assert "Stage 1 read->DummyPreprocessor:" in stats, stats + assert "Stage 2 MapBatches(ScoringWrapper):" in stats, stats assert max(out) == 16.0, out ds = batch_predictor.predict_pipelined( @@ -558,7 +558,7 @@ def test_separate_gpu_stage_pipelined(shutdown_only): out = [x["value"] for x in ds.iter_rows()] stats = ds.stats() assert "Stage 1 read:" in stats, stats - assert "Stage 2 map_batches:" in stats, stats + assert "Stage 2 MapBatches(ScoringWrapper):" in stats, stats assert max(out) == 16.0, out From 7b2299be8e69f4abf96b5cbb076c035b0a285792 Mon Sep 17 00:00:00 2001 From: andreapiso <14676006+andreapiso@users.noreply.github.com> Date: Fri, 27 Jan 2023 22:53:31 +0800 Subject: [PATCH 019/267] Enable Log Rotation on Serve (#31844) This PR adds log rotation for Ray Serve, letting it inherit rotation parameters (max_bytes, backup_count) from Ray Core, bringing a more consistent logging experience to Ray (as opposed to having the serve/ folder grow forever while the other logs rotate. 
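For illustration, a minimal sketch (not part of this patch) of exercising the inherited rotation settings: the Ray Core rotation variables are set before `ray.init()`, and the Serve component logs under `/tmp/ray/session_latest/logs/serve/` then rotate accordingly. The deployment and the 1 MiB / 3-backup values below are hypothetical, mirroring the test added in this patch.

```
import logging
import os

import ray
from ray import serve

# Rotation settings are read at node startup, so they must be set before
# ray.init() (this mirrors the monkeypatched test added in this patch).
os.environ["RAY_ROTATION_MAX_BYTES"] = str(1024 * 1024)  # rotate at ~1 MiB
os.environ["RAY_ROTATION_BACKUP_COUNT"] = "3"            # keep 3 rotated files

ray.init(num_cpus=1)

@serve.deployment
class Echo:
    def __call__(self, request) -> str:
        # Replica logs written to /tmp/ray/session_latest/logs/serve/ now go
        # through a RotatingFileHandler instead of a plain FileHandler.
        logging.getLogger("ray.serve").info("handled a request")
        return "ok"

serve.run(Echo.bind())
```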
--- doc/source/ray-observability/ray-logging.rst | 3 ++ .../serve/production-guide/monitoring.md | 2 ++ python/ray/serve/_private/logging_utils.py | 12 ++++++- python/ray/serve/tests/test_logging.py | 32 +++++++++++++++++++ 4 files changed, 48 insertions(+), 1 deletion(-) diff --git a/doc/source/ray-observability/ray-logging.rst b/doc/source/ray-observability/ray-logging.rst index b4220fef0bc5..692fbeb479e0 100644 --- a/doc/source/ray-observability/ray-logging.rst +++ b/doc/source/ray-observability/ray-logging.rst @@ -173,8 +173,11 @@ Here's a Ray log directory structure. Note that ``.out`` is logs from stdout/std - ``runtime_env_setup-ray_client_server_[port].log``: Logs from installing :ref:`runtime environments ` for a job when connecting via :ref:`Ray Client `. - ``worker-[worker_id]-[job_id]-[pid].[out|err]``: Python/Java part of Ray drivers and workers. All of stdout and stderr from tasks/actors are streamed here. Note that job_id is an id of the driver.- +.. _ray-log-rotation: + Log rotation ------------ + Ray supports log rotation of log files. Note that not all components are currently supporting log rotation. (Raylet and Python/Java worker logs are not rotating). By default, logs are rotating when it reaches to 512MB (maxBytes), and there could be up to 5 backup files (backupCount). Indexes are appended to all backup files (e.g., `raylet.out.1`) diff --git a/doc/source/serve/production-guide/monitoring.md b/doc/source/serve/production-guide/monitoring.md index 47b96604be4f..d9d913a9fd18 100644 --- a/doc/source/serve/production-guide/monitoring.md +++ b/doc/source/serve/production-guide/monitoring.md @@ -99,6 +99,8 @@ This causes the HTTP proxy and deployment replica to print log statements to the A copy of these logs are stored at `/tmp/ray/session_latest/logs/serve/`. You can parse these stored logs with a logging stack such as ELK or [Loki](serve-logging-loki) to search them by deployment or replica. +Serve supports [Log Rotation](ray-log-rotation) of these logs through setting the environment variables `RAY_ROTATION_MAX_BYTES` and `RAY_ROTATION_BACKUP_COUNT`. + To silence the replica-level logs or otherwise configure logging, configure the `"ray.serve"` logger **inside the deployment constructor**: ```python diff --git a/python/ray/serve/_private/logging_utils.py b/python/ray/serve/_private/logging_utils.py index 1d76be1057f5..11604f8e3de8 100644 --- a/python/ray/serve/_private/logging_utils.py +++ b/python/ray/serve/_private/logging_utils.py @@ -22,6 +22,8 @@ def configure_component_logger( log_level: int = logging.INFO, log_to_stream: bool = True, log_to_file: bool = True, + max_bytes: Optional[int] = None, + backup_count: Optional[int] = None, ): """Returns a logger to be used by a Serve component. 
@@ -51,12 +53,20 @@ def configure_component_logger( ray._private.worker._global_node.get_logs_dir_path(), "serve" ) os.makedirs(logs_dir, exist_ok=True) + if max_bytes is None: + max_bytes = ray._private.worker._global_node.max_bytes + if backup_count is None: + backup_count = ray._private.worker._global_node.backup_count if component_type is not None: component_name = f"{component_type}_{component_name}" log_file_name = LOG_FILE_FMT.format( component_name=component_name, component_id=component_id ) - file_handler = logging.FileHandler(os.path.join(logs_dir, log_file_name)) + file_handler = logging.handlers.RotatingFileHandler( + os.path.join(logs_dir, log_file_name), + maxBytes=max_bytes, + backupCount=backup_count, + ) file_handler.setFormatter(formatter) logger.addHandler(file_handler) diff --git a/python/ray/serve/tests/test_logging.py b/python/ray/serve/tests/test_logging.py index 47ef85a622b1..6b5b2c37c21b 100644 --- a/python/ray/serve/tests/test_logging.py +++ b/python/ray/serve/tests/test_logging.py @@ -12,6 +12,38 @@ from ray._private.test_utils import wait_for_condition +def set_logging_config(monkeypatch, max_bytes, backup_count): + monkeypatch.setenv("RAY_ROTATION_MAX_BYTES", str(max_bytes)) + monkeypatch.setenv("RAY_ROTATION_BACKUP_COUNT", str(backup_count)) + + +def test_log_rotation_config(monkeypatch, ray_shutdown): + # This test should be executed before any test that uses + # the shared serve_instance, as environment variables + # for log rotation need to be set before ray.init + logger = logging.getLogger("ray.serve") + max_bytes = 100 + backup_count = 3 + set_logging_config(monkeypatch, max_bytes, backup_count) + ray.init(num_cpus=1) + + @serve.deployment + class Handle: + def __call__(self): + handlers = logger.handlers + res = {} + for handler in handlers: + if isinstance(handler, logging.handlers.RotatingFileHandler): + res["max_bytes"] = handler.maxBytes + res["backup_count"] = handler.backupCount + return res + + handle = serve.run(Handle.bind()) + rotation_config = ray.get(handle.remote()) + assert rotation_config["max_bytes"] == max_bytes + assert rotation_config["backup_count"] == backup_count + + def test_handle_access_log(serve_instance): name = "handler" From ed72ca8f10a09c9934a51fc3579d11c64fda58b4 Mon Sep 17 00:00:00 2001 From: Ricky Xu Date: Fri, 27 Jan 2023 09:55:43 -0500 Subject: [PATCH 020/267] [core][state] Handle driver tasks (#31832) This PR adds additional information to the driver task event, namely, driver task type, and it's running/finished timestamps. This allows users (i.e. the dashboard) to inspect driver task more easily. This PR also exposes the exclude_driver flag to state API, allowing requests through https and ListAPiOptions to get driver tasks, while the default behaviour from state API will still be excluding it. This PR also filters out any tasks w/o task_info to prevent missing data issue. 
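For illustration, a minimal sketch (not part of this patch) of the new `exclude_driver` option from the Python side, mirroring the pattern used in the test added below. It assumes task event reporting is enabled on the cluster; the printed summary is hypothetical.

```
import ray
from ray.experimental.state.api import StateApiClient
from ray.experimental.state.common import ListApiOptions, StateResource

ray.init()

client = StateApiClient()

# exclude_driver defaults to True, so driver tasks normally stay hidden;
# passing exclude_driver=False opts back into DRIVER_TASK entries.
tasks_with_driver = client.list(
    StateResource.TASKS,
    options=ListApiOptions(exclude_driver=False),
    raise_on_missing_output=True,
)
driver_tasks = [t for t in tasks_with_driver if t["type"] == "DRIVER_TASK"]
print(f"{len(driver_tasks)} driver task(s) reported, "
      f"state(s): {[t['state'] for t in driver_tasks]}")
```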
--- dashboard/modules/state/state_head.py | 9 ++- dashboard/state_aggregator.py | 8 +- python/ray/experimental/state/api.py | 2 +- python/ray/experimental/state/common.py | 3 + .../ray/experimental/state/state_manager.py | 8 +- python/ray/tests/test_state_api.py | 4 +- python/ray/tests/test_task_events.py | 81 ++++++++++++++++--- src/ray/core_worker/core_worker.cc | 31 ++++++- src/ray/core_worker/task_manager.cc | 2 + src/ray/gcs/gcs_server/gcs_task_manager.cc | 9 ++- .../gcs_server/test/gcs_task_manager_test.cc | 51 +++++++++++- src/ray/protobuf/gcs_service.proto | 2 +- 12 files changed, 185 insertions(+), 25 deletions(-) diff --git a/dashboard/modules/state/state_head.py b/dashboard/modules/state/state_head.py index 3358f03da337..b2e755b35e0d 100644 --- a/dashboard/modules/state/state_head.py +++ b/dashboard/modules/state/state_head.py @@ -192,9 +192,16 @@ def _options_from_req(self, req: aiohttp.web.Request) -> ListApiOptions: timeout = int(req.query.get("timeout", 30)) filters = self._get_filters_from_req(req) detail = convert_string_to_type(req.query.get("detail", False), bool) + exclude_driver = convert_string_to_type( + req.query.get("exclude_driver", True), bool + ) return ListApiOptions( - limit=limit, timeout=timeout, filters=filters, detail=detail + limit=limit, + timeout=timeout, + filters=filters, + detail=detail, + exclude_driver=exclude_driver, ) def _summary_options_from_req(self, req: aiohttp.web.Request) -> SummaryApiOptions: diff --git a/dashboard/state_aggregator.py b/dashboard/state_aggregator.py index ebec09d7b917..c75b5d5385db 100644 --- a/dashboard/state_aggregator.py +++ b/dashboard/state_aggregator.py @@ -373,13 +373,15 @@ async def list_tasks(self, *, option: ListApiOptions) -> ListApiResponse: """ job_id = None for filter in option.filters: - if filter[0] == "job_id": + if filter[0] == "job_id" and filter[1] == "=": + # Filtering by job_id == xxxx, pass it to source side filtering. # tuple consists of (job_id, predicate, value) job_id = filter[2] - try: reply = await self._client.get_all_task_info( - timeout=option.timeout, job_id=job_id + timeout=option.timeout, + job_id=job_id, + exclude_driver=option.exclude_driver, ) except DataSourceUnavailable: raise DataSourceUnavailable(GCS_QUERY_FAILURE_WARNING) diff --git a/python/ray/experimental/state/api.py b/python/ray/experimental/state/api.py index 4512e8bda780..daefed8b423b 100644 --- a/python/ray/experimental/state/api.py +++ b/python/ray/experimental/state/api.py @@ -174,7 +174,7 @@ def _make_param(cls, options: Union[ListApiOptions, GetApiOptions]) -> Dict: continue option_val = getattr(options, field.name) - if option_val: + if option_val is not None: options_dict[field.name] = option_val return options_dict diff --git a/python/ray/experimental/state/common.py b/python/ray/experimental/state/common.py index 664041240aca..6e997820857c 100644 --- a/python/ray/experimental/state/common.py +++ b/python/ray/experimental/state/common.py @@ -88,6 +88,8 @@ class ListApiOptions: filters: Optional[List[Tuple[str, PredicateType, SupportedFilterType]]] = field( default_factory=list ) + # [only tasks] If driver tasks should be excluded. + exclude_driver: bool = True # When the request is processed on the server side, # we should apply multiplier so that server side can finish # processing a request within timeout. 
Otherwise, @@ -99,6 +101,7 @@ def __post_init__(self): assert isinstance(self.limit, int) assert isinstance(self.timeout, int) assert isinstance(self.detail, bool) + assert isinstance(self.exclude_driver, bool) assert isinstance(self.filters, list) or self.filters is None, ( "filters must be a list type. Given filters: " f"{self.filters} type: {type(self.filters)}. " diff --git a/python/ray/experimental/state/state_manager.py b/python/ray/experimental/state/state_manager.py index c82c0211f311..70d22b8fa070 100644 --- a/python/ray/experimental/state/state_manager.py +++ b/python/ray/experimental/state/state_manager.py @@ -234,14 +234,18 @@ async def get_all_actor_info( @handle_grpc_network_errors async def get_all_task_info( - self, timeout: int = None, limit: int = None, job_id: Optional[str] = None + self, + timeout: int = None, + limit: int = None, + job_id: Optional[str] = None, + exclude_driver: bool = True, ) -> Optional[GetTaskEventsReply]: if not limit: limit = RAY_MAX_LIMIT_FROM_DATA_SOURCE if job_id: job_id = JobID(hex_to_binary(job_id)).binary() request = GetTaskEventsRequest( - limit=limit, exclude_driver_task=True, job_id=job_id + limit=limit, exclude_driver=exclude_driver, job_id=job_id ) reply = await self._gcs_task_info_stub.GetTaskEvents(request, timeout=timeout) return reply diff --git a/python/ray/tests/test_state_api.py b/python/ray/tests/test_state_api.py index 3859eb11f43a..c37f4b0fc00c 100644 --- a/python/ray/tests/test_state_api.py +++ b/python/ray/tests/test_state_api.py @@ -283,6 +283,7 @@ def create_api_options( limit: int = DEFAULT_LIMIT, filters: List[Tuple[str, SupportedFilterType]] = None, detail: bool = False, + exclude_driver: bool = True, ): if not filters: filters = [] @@ -292,6 +293,7 @@ def create_api_options( filters=filters, _server_timeout_multiplier=1.0, detail=detail, + exclude_driver=exclude_driver, ) @@ -804,7 +806,7 @@ async def test_api_manager_list_tasks(state_api_manager): ] result = await state_api_manager.list_tasks(option=create_api_options()) data_source_client.get_all_task_info.assert_any_await( - timeout=DEFAULT_RPC_TIMEOUT, job_id=None + timeout=DEFAULT_RPC_TIMEOUT, job_id=None, exclude_driver=True ) data = result.result data = data diff --git a/python/ray/tests/test_task_events.py b/python/ray/tests/test_task_events.py index 87d16772a363..425f1f5931cc 100644 --- a/python/ray/tests/test_task_events.py +++ b/python/ray/tests/test_task_events.py @@ -4,12 +4,13 @@ import time import ray +from ray.experimental.state.common import ListApiOptions, StateResource from ray._private.test_utils import ( raw_metrics, run_string_as_driver_nonblocking, wait_for_condition, ) -from ray.experimental.state.api import list_tasks +from ray.experimental.state.api import StateApiClient, list_tasks from ray._private.worker import RayContext @@ -68,7 +69,7 @@ def verify(): "At least 10 tasks events should be reported. " "Could be more than 10 with multiple flush." ) - assert metric["STORED"] == 10, "10 task's events should be stored." + assert metric["STORED"] == 11, "10 task + 1 driver's events should be stored." 
return True @@ -123,6 +124,66 @@ def verify(): ) +def test_handle_driver_tasks(shutdown_only): + ray.init(_system_config=_SYSTEM_CONFIG) + + job_id = ray.get_runtime_context().get_job_id() + script = """ +import ray +import time +ray.init("auto") + +@ray.remote +def f(): + time.sleep(3) + + +ray.get(f.remote()) +""" + run_string_as_driver_nonblocking(script) + + client = StateApiClient() + + def list_tasks(exclude_driver): + return client.list( + StateResource.TASKS, + # Filter out this driver + options=ListApiOptions( + exclude_driver=exclude_driver, filters=[("job_id", "!=", job_id)] + ), + raise_on_missing_output=True, + ) + + # Check driver running + def verify(): + tasks_with_driver = list_tasks(exclude_driver=False) + assert len(tasks_with_driver) == 2, tasks_with_driver + task_types = {task["type"] for task in tasks_with_driver} + assert task_types == {"NORMAL_TASK", "DRIVER_TASK"} + + for task in tasks_with_driver: + if task["type"] == "DRIVER_TASK": + assert task["state"] == "RUNNING", task + + return True + + wait_for_condition(verify, timeout=15, retry_interval_ms=1000) + + # Check driver finishes + def verify(): + tasks_with_driver = list_tasks(exclude_driver=False) + assert len(tasks_with_driver) == 2, tasks_with_driver + for task in tasks_with_driver: + if task["type"] == "DRIVER_TASK": + assert task["state"] == "FINISHED", task + + tasks_no_driver = list_tasks(exclude_driver=True) + assert len(tasks_no_driver) == 1, tasks_no_driver + return True + + wait_for_condition(verify) + + def test_fault_tolerance_job_failed(shutdown_only): ray.init(num_cpus=8, _system_config=_SYSTEM_CONFIG) script = """ @@ -184,11 +245,11 @@ def verify(): for task in tasks: if "finished" in task["func_or_class_name"]: assert ( - task["scheduling_state"] == "FINISHED" + task["state"] == "FINISHED" ), f"task {task['func_or_class_name']} has wrong state" else: assert ( - task["scheduling_state"] == "FAILED" + task["state"] == "FAILED" ), f"task {task['func_or_class_name']} has wrong state" return True @@ -247,9 +308,9 @@ def verify(): ), "1 creation task + 1 actor tasks + 2 normal tasks run by the actor tasks" for task in tasks: if "finish" in task["name"] or "__init__" in task["name"]: - assert task["scheduling_state"] == "FINISHED", task + assert task["state"] == "FINISHED", task else: - assert task["scheduling_state"] == "FAILED", task + assert task["state"] == "FAILED", task return True @@ -276,9 +337,9 @@ def verify(): ) for task in tasks: if "finish" in task["name"] or "__init__" in task["name"]: - assert task["scheduling_state"] == "FINISHED", task + assert task["state"] == "FINISHED", task else: - assert task["scheduling_state"] == "FAILED", task + assert task["state"] == "FAILED", task return True @@ -405,9 +466,9 @@ def add_death_tasks_recur(task, execution_graph, dead_tasks): for task in target_tasks: if task["name"] in dead_tasks: - assert task["scheduling_state"] == "FAILED", task["name"] + assert task["state"] == "FAILED", task["name"] else: - assert task["scheduling_state"] == "RUNNING", task["name"] + assert task["state"] == "RUNNING", task["name"] return True diff --git a/src/ray/core_worker/core_worker.cc b/src/ray/core_worker/core_worker.cc index 61a10cc5f847..c3ea072b52db 100644 --- a/src/ray/core_worker/core_worker.cc +++ b/src/ray/core_worker/core_worker.cc @@ -360,11 +360,27 @@ CoreWorker::CoreWorker(const CoreWorkerOptions &options, const WorkerID &worker_ builder.SetDriverTaskSpec(task_id, options_.language, worker_context_.GetCurrentJobID(), - 
TaskID::ComputeDriverTaskId(worker_context_.GetWorkerID()), + // Driver has no parent task + /* parent_task_id */ TaskID::Nil(), GetCallerId(), rpc_address_); // Drivers are never re-executed. SetCurrentTaskId(task_id, /*attempt_number=*/0, "driver"); + + // Add the driver task info. + if (task_event_buffer_->Enabled()) { + rpc::TaskEvents task_event; + const auto spec = builder.Build(); + auto task_info = task_manager_->MakeTaskInfoEntry(spec); + task_event.set_task_id(task_id.Binary()); + task_event.set_job_id(spec.JobId().Binary()); + task_event.set_attempt_number(0); + task_event.mutable_task_info()->Swap(&task_info); + gcs::FillTaskStatusUpdateTime(rpc::TaskStatus::RUNNING, + absl::GetCurrentTimeNanos(), + task_event.mutable_state_updates()); + task_event_buffer_->AddTaskEvent(std::move(task_event)); + } } auto raylet_client_factory = [this](const std::string ip_address, int port) { @@ -643,6 +659,19 @@ void CoreWorker::Disconnect( // Force stats export before exiting the worker. RecordMetrics(); + // Driver exiting. + if (options_.worker_type == WorkerType::DRIVER && task_event_buffer_->Enabled()) { + // Mark Driver as finished. + rpc::TaskEvents task_event; + task_event.set_task_id(worker_context_.GetCurrentTaskID().Binary()); + task_event.set_job_id(worker_context_.GetCurrentJobID().Binary()); + task_event.set_attempt_number(0); + gcs::FillTaskStatusUpdateTime(rpc::TaskStatus::FINISHED, + absl::GetCurrentTimeNanos(), + task_event.mutable_state_updates()); + task_event_buffer_->AddTaskEvent(std::move(task_event)); + } + // Force task state events push before exiting the worker. task_event_buffer_->FlushEvents(/* forced */ true); diff --git a/src/ray/core_worker/task_manager.cc b/src/ray/core_worker/task_manager.cc index a3839592c9f5..3cf71e383d19 100644 --- a/src/ray/core_worker/task_manager.cc +++ b/src/ray/core_worker/task_manager.cc @@ -842,6 +842,8 @@ rpc::TaskInfoEntry TaskManager::MakeTaskInfoEntry( rpc::TaskType type; if (task_spec.IsNormalTask()) { type = rpc::TaskType::NORMAL_TASK; + } else if (task_spec.IsDriverTask()) { + type = rpc::TaskType::DRIVER_TASK; } else if (task_spec.IsActorCreationTask()) { type = rpc::TaskType::ACTOR_CREATION_TASK; task_info.set_actor_id(task_spec.ActorCreationId().Binary()); diff --git a/src/ray/gcs/gcs_server/gcs_task_manager.cc b/src/ray/gcs/gcs_server/gcs_task_manager.cc index 68f75cd918a3..7810f2ff0b50 100644 --- a/src/ray/gcs/gcs_server/gcs_task_manager.cc +++ b/src/ray/gcs/gcs_server/gcs_task_manager.cc @@ -367,8 +367,13 @@ void GcsTaskManager::HandleGetTaskEvents(rpc::GetTaskEventsRequest request, for (auto itr = task_events.rbegin(); itr != task_events.rend(); ++itr) { auto &task_event = *itr; - if (request.exclude_driver_task() && !task_event.has_state_updates()) { - // Driver related profile events will generate TaskEvent w/o any task state updates. + if (!task_event.has_task_info()) { + // Skip task events w/o task info. 
+ continue; + } + + if (request.exclude_driver() && + task_event.task_info().type() == rpc::TaskType::DRIVER_TASK) { continue; } diff --git a/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc b/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc index bf192b2ec609..4932794d521b 100644 --- a/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc +++ b/src/ray/gcs/gcs_server/test/gcs_task_manager_test.cc @@ -99,7 +99,8 @@ class GcsTaskManagerTest : public ::testing::Test { rpc::GetTaskEventsReply SyncGetTaskEvents(absl::flat_hash_set task_ids, absl::optional job_id = absl::nullopt, - int64_t limit = -1) { + int64_t limit = -1, + bool exclude_driver = true) { rpc::GetTaskEventsRequest request; rpc::GetTaskEventsReply reply; std::promise promise; @@ -118,6 +119,8 @@ class GcsTaskManagerTest : public ::testing::Test { request.set_limit(limit); } + request.set_exclude_driver(exclude_driver); + task_manager->HandleGetTaskEvents( request, &reply, @@ -131,11 +134,14 @@ class GcsTaskManagerTest : public ::testing::Test { return reply; } - static rpc::TaskInfoEntry GenTaskInfo(JobID job_id, - TaskID parent_task_id = TaskID::Nil()) { + static rpc::TaskInfoEntry GenTaskInfo( + JobID job_id, + TaskID parent_task_id = TaskID::Nil(), + rpc::TaskType task_type = rpc::TaskType::NORMAL_TASK) { rpc::TaskInfoEntry task_info; task_info.set_job_id(job_id.Binary()); task_info.set_parent_task_id(parent_task_id.Binary()); + task_info.set_type(task_type); return task_info; } @@ -188,6 +194,8 @@ class GcsTaskManagerTest : public ::testing::Test { if (task_info.has_value()) { events.mutable_task_info()->CopyFrom(*task_info); + } else { + events.mutable_task_info()->CopyFrom(GenTaskInfo(JobID::FromInt(job_id))); } result.push_back(events); @@ -732,6 +740,43 @@ TEST_F(GcsTaskManagerMemoryLimitedTest, TestLimitTaskEvents) { } } +TEST_F(GcsTaskManagerTest, TestGetTaskEventsWithDriver) { + // Add task events + auto task_ids = GenTaskIDs(1); + auto driver_task = task_ids[0]; + + // Add Driver + { + auto events = GenTaskEvents( + {driver_task}, + /* attempt_number */ 0, + /* job_id */ 0, + /* profile event */ absl::nullopt, + /* status_update*/ absl::nullopt, + GenTaskInfo( + /* job_id */ JobID::FromInt(0), TaskID::Nil(), rpc::TaskType::DRIVER_TASK)); + auto events_data = Mocker::GenTaskEventsData(events); + SyncAddTaskEventData(events_data); + } + + // Should get the event when including driver + { + auto reply = SyncGetTaskEvents(/* task_ids */ {}, + /* job_id */ absl::nullopt, + /* limit */ -1, + /* exclude_driver*/ false); + EXPECT_EQ(reply.events_by_task_size(), 1); + } + + // Default exclude driver + { + auto reply = SyncGetTaskEvents(/* task_ids */ {}, + /* job_id */ absl::nullopt, + /* limit */ -1); + EXPECT_EQ(reply.events_by_task_size(), 0); + } +} + TEST_F(GcsTaskManagerMemoryLimitedTest, TestLimitReturnRecentTasksWhenGetAll) { // Keep adding tasks and make sure even with eviction, the returned tasks are // the mo diff --git a/src/ray/protobuf/gcs_service.proto b/src/ray/protobuf/gcs_service.proto index 14bf644fed9d..2d7e214c6e60 100644 --- a/src/ray/protobuf/gcs_service.proto +++ b/src/ray/protobuf/gcs_service.proto @@ -611,7 +611,7 @@ message GetTaskEventsRequest { // guarantee. optional int64 limit = 3; // True if task events from driver (only profiling events) should be excluded. 
- bool exclude_driver_task = 4; + bool exclude_driver = 4; } message GetTaskEventsReply { From 3f1a880f7a4b248366ca00ea31483341d2eee1cf Mon Sep 17 00:00:00 2001 From: Cindy Zhang Date: Fri, 27 Jan 2023 09:18:46 -0800 Subject: [PATCH 021/267] [serve] Add exponential backoff when retrying replicas (#31436) If deployment is repeatedly failing, perform exponential backoff so as to not repeatedly try to restart the replica at a very fast rate. Related issue number Closes #31121 --- python/ray/serve/_private/deployment_state.py | 81 ++++++++++++++----- .../ray/serve/tests/test_deployment_state.py | 51 ++++++++++++ 2 files changed, 111 insertions(+), 21 deletions(-) diff --git a/python/ray/serve/_private/deployment_state.py b/python/ray/serve/_private/deployment_state.py index 9db5d6256de9..002a8fa3ea46 100644 --- a/python/ray/serve/_private/deployment_state.py +++ b/python/ray/serve/_private/deployment_state.py @@ -114,6 +114,9 @@ def from_deployment_info( os.environ.get("SERVE_SLOW_STARTUP_WARNING_PERIOD_S", 30) ) +EXPONENTIAL_BACKOFF_FACTOR = float(os.environ.get("EXPONENTIAL_BACKOFF_FACTOR", 2.0)) +MAX_BACKOFF_TIME_S = int(os.environ.get("SERVE_MAX_BACKOFF_TIME_S", 64)) + ALL_REPLICA_STATES = list(ReplicaState) _SCALING_LOG_ENABLED = os.environ.get("SERVE_ENABLE_SCALING_LOG", "0") != "0" @@ -978,6 +981,9 @@ def __init__( # DeploymentInfo and bring current deployment to meet new status. self._target_state: DeploymentTargetState = DeploymentTargetState.default() self._prev_startup_warning: float = time.time() + # Exponential backoff when retrying a consistently failing deployment + self._last_retry: float = 0.0 + self._backoff_time_s: int = 1 self._replica_constructor_retry_counter: int = 0 self._replicas: ReplicaStateContainer = ReplicaStateContainer() self._curr_status_info: DeploymentStatusInfo = DeploymentStatusInfo( @@ -1104,6 +1110,7 @@ def _set_target_state(self, target_info: DeploymentInfo) -> None: self._name, DeploymentStatus.UPDATING ) self._replica_constructor_retry_counter = 0 + self._backoff_time_s = 1 logger.debug(f"Deploying new version of {self._name}: {target_state.version}.") @@ -1308,28 +1315,43 @@ def _scale_deployment_replicas(self) -> bool: ) to_add = max(delta_replicas - stopping_replicas, 0) if to_add > 0: + # Exponential backoff + failed_to_start_threshold = min( + MAX_DEPLOYMENT_CONSTRUCTOR_RETRY_COUNT, + self._target_state.num_replicas * 3, + ) + if self._replica_constructor_retry_counter >= failed_to_start_threshold: + # Wait 1, 2, 4, ... seconds before consecutive retries, with random + # offset added to avoid synchronization + if ( + time.time() - self._last_retry + < self._backoff_time_s + random.uniform(0, 3) + ): + return replicas_stopped + + self._last_retry = time.time() logger.info( f"Adding {to_add} replica{'s' if to_add > 1 else ''} " f"to deployment '{self._name}'." 
) - for _ in range(to_add): - replica_name = ReplicaName(self._name, get_random_letters()) - new_deployment_replica = DeploymentReplica( - self._controller_name, - self._detached, - replica_name.replica_tag, - replica_name.deployment_tag, - self._target_state.version, - ) - new_deployment_replica.start( - self._target_state.info, self._target_state.version - ) + for _ in range(to_add): + replica_name = ReplicaName(self._name, get_random_letters()) + new_deployment_replica = DeploymentReplica( + self._controller_name, + self._detached, + replica_name.replica_tag, + replica_name.deployment_tag, + self._target_state.version, + ) + new_deployment_replica.start( + self._target_state.info, self._target_state.version + ) - self._replicas.add(ReplicaState.STARTING, new_deployment_replica) - logger.debug( - "Adding STARTING to replica_tag: " - f"{replica_name}, deployment: {self._name}" - ) + self._replicas.add(ReplicaState.STARTING, new_deployment_replica) + logger.debug( + "Adding STARTING to replica_tag: " + f"{replica_name}, deployment: {self._name}" + ) elif delta_replicas < 0: replicas_stopped = True @@ -1407,10 +1429,10 @@ def _check_curr_status(self) -> bool: name=self._name, status=DeploymentStatus.UNHEALTHY, message=( - f"The Deployment failed to start {failed_to_start_count} " - "times in a row. This may be due to a problem with the " - "deployment constructor or the initial health check failing. " - "See logs for details." + f"The Deployment failed to start {failed_to_start_count} times " + "in a row. This may be due to a problem with the deployment " + "constructor or the initial health check failing. See logs for " + f"details. Retrying after {self._backoff_time_s} seconds." ), ) return False @@ -1453,6 +1475,7 @@ def _check_startup_replicas( """ slow_replicas = [] transitioned_to_running = False + replicas_failed = False for replica in self._replicas.pop(states=[original_state]): start_status = replica.check_started() if start_status == ReplicaStartupStatus.SUCCEEDED: @@ -1466,6 +1489,7 @@ def _check_startup_replicas( # Increase startup failure counter if we're tracking it self._replica_constructor_retry_counter += 1 + replicas_failed = True replica.stop(graceful=False) self._replicas.add(ReplicaState.STOPPING, replica) elif start_status in [ @@ -1485,6 +1509,21 @@ def _check_startup_replicas( else: self._replicas.add(original_state, replica) + # If replicas have failed enough times, execute exponential backoff + # Wait 1, 2, 4, ... 
seconds before consecutive retries (or use a custom + # backoff factor by setting EXPONENTIAL_BACKOFF_FACTOR) + failed_to_start_threshold = min( + MAX_DEPLOYMENT_CONSTRUCTOR_RETRY_COUNT, + self._target_state.num_replicas * 3, + ) + if ( + replicas_failed + and self._replica_constructor_retry_counter > failed_to_start_threshold + ): + self._backoff_time_s = min( + EXPONENTIAL_BACKOFF_FACTOR * self._backoff_time_s, MAX_BACKOFF_TIME_S + ) + return slow_replicas, transitioned_to_running def _check_and_update_replicas(self) -> bool: diff --git a/python/ray/serve/tests/test_deployment_state.py b/python/ray/serve/tests/test_deployment_state.py index 1ce865997d96..5113a0761b7c 100644 --- a/python/ray/serve/tests/test_deployment_state.py +++ b/python/ray/serve/tests/test_deployment_state.py @@ -1991,6 +1991,57 @@ def test_deploy_with_transient_constructor_failure( assert deployment_state.curr_status_info.status == DeploymentStatus.HEALTHY +@pytest.mark.parametrize("mock_deployment_state", [False], indirect=True) +@patch.object(DriverDeploymentState, "_get_all_node_ids") +def test_exponential_backoff(mock_get_all_node_ids, mock_deployment_state): + """Test exponential backoff.""" + deployment_state, timer = mock_deployment_state + mock_get_all_node_ids.return_value = [(str(i), str(i)) for i in range(2)] + + b_info_1, b_version_1 = deployment_info(num_replicas=2) + updating = deployment_state.deploy(b_info_1) + assert updating + assert deployment_state.curr_status_info.status == DeploymentStatus.UPDATING + + _constructor_failure_loop_two_replica(deployment_state, 3) + assert deployment_state._replica_constructor_retry_counter == 6 + last_retry = timer.time() + + for i in range(7): + while timer.time() - last_retry < 2**i: + deployment_state.update() + assert deployment_state._replica_constructor_retry_counter == 6 + 2 * i + # Check that during backoff time, no replicas are created + check_counts(deployment_state, total=0) + timer.advance(0.1) # simulate time passing between each call to udpate + + # Skip past random additional backoff time used to avoid synchronization + timer.advance(5) + + # Set new replicas to fail consecutively + check_counts(deployment_state, total=0) # No replicas + deployment_state.update() + last_retry = timer.time() # This should be time at which replicas were retried + check_counts(deployment_state, total=2) # Two new replicas + replica_1 = deployment_state._replicas.get()[0] + replica_2 = deployment_state._replicas.get()[1] + replica_1._actor.set_failed_to_start() + replica_2._actor.set_failed_to_start() + timer.advance(0.1) # simulate time passing between each call to udpate + + # Now the replica should be marked STOPPING after failure. + deployment_state.update() + check_counts(deployment_state, total=2, by_state=[(ReplicaState.STOPPING, 2)]) + timer.advance(0.1) # simulate time passing between each call to udpate + + # Once it's done stopping, replica should be removed. 
+ replica_1._actor.set_done_stopping() + replica_2._actor.set_done_stopping() + deployment_state.update() + check_counts(deployment_state, total=0) + timer.advance(0.1) # simulate time passing between each call to udpate + + @pytest.fixture def mock_deployment_state_manager(request) -> Tuple[DeploymentStateManager, Mock]: ray.init() From 76d746786bf335a7f093bbab71e7e48ee16fccd3 Mon Sep 17 00:00:00 2001 From: kourosh hakhamaneshi <31483498+kouroshHakha@users.noreply.github.com> Date: Fri, 27 Jan 2023 09:24:16 -0800 Subject: [PATCH 022/267] [RLlib] Fixed the autorom dependency issue (#31933) Co-authored-by: Cade Daniel Closes https://github.com/ray-project/ray/issues/31880 --- release/rllib_tests/app_config.yaml | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/release/rllib_tests/app_config.yaml b/release/rllib_tests/app_config.yaml index b66417df9249..2dae5b40912c 100755 --- a/release/rllib_tests/app_config.yaml +++ b/release/rllib_tests/app_config.yaml @@ -19,7 +19,10 @@ python: - ale-py==0.8.0 - gym==0.26.2 - mujoco-py<2.2,>=2.1 - - autorom[accept-rom-license] + # AutoROM downloads ROMs via torrent when they are built. The torrent is unreliable, + # so we built it for py3 and use that instead. This wheel was tested for python 3.7, 3.8, + # and 3.9. + - https://ray-ci-deps-wheels.s3.us-west-2.amazonaws.com/AutoROM.accept_rom_license-0.5.4-py3-none-any.whl conda_packages: [] post_build_cmds: From 15af4857c30eaaf4233ffd5934af9dbd30a4b720 Mon Sep 17 00:00:00 2001 From: Alan Guo Date: Fri, 27 Jan 2023 09:57:53 -0800 Subject: [PATCH 023/267] Polish the Dashboard new IA part 2 (#31946) Adds back the metrics page Adds button to visit new dashboard and to go back Adds buttons for leaving feedback and viewing docs Add color to status badges of tasks and placement groups table Add alert when grafana is not running Fix copy button icon Separate metrics page into sections (both new IA and old IA) --- dashboard/client/src/App.tsx | 12 +- .../client/src/components/EventTable.tsx | 7 +- .../MetadataSection/MetadataSection.tsx | 4 +- .../src/components/PlacementGroupTable.tsx | 2 +- .../client/src/components/StatusChip.tsx | 41 ++- dashboard/client/src/components/TaskTable.tsx | 2 +- dashboard/client/src/pages/actor/index.tsx | 8 + dashboard/client/src/pages/job/JobDetail.tsx | 55 +++- dashboard/client/src/pages/job/JobRow.tsx | 49 +-- .../client/src/pages/layout/MainNavLayout.tsx | 75 ++++- dashboard/client/src/pages/layout/index.tsx | 17 + .../pages/metrics/Metrics.component.test.tsx | 70 +++++ .../client/src/pages/metrics/Metrics.tsx | 296 ++++++++++++------ dashboard/client/src/pages/metrics/utils.ts | 36 ++- .../overview/OverviewPage.component.test.tsx | 1 - .../src/pages/overview/OverviewPage.tsx | 11 - .../overview/cards/ClusterUtilizationCard.tsx | 45 ++- .../pages/overview/cards/NodeCountCard.tsx | 35 ++- ...{placementGroup.d.ts => placementGroup.ts} | 0 dashboard/modules/metrics/metrics_head.py | 2 +- 20 files changed, 571 insertions(+), 197 deletions(-) create mode 100644 dashboard/client/src/pages/metrics/Metrics.component.test.tsx rename dashboard/client/src/type/{placementGroup.d.ts => placementGroup.ts} (100%) diff --git a/dashboard/client/src/App.tsx b/dashboard/client/src/App.tsx index 302a9afe3985..b45d1f0db50f 100644 --- a/dashboard/client/src/App.tsx +++ b/dashboard/client/src/App.tsx @@ -52,6 +52,10 @@ type GlobalContextType = { * running as detected by the grafana healthcheck endpoint. 
*/ grafanaHost: string | undefined; + /** + * Whether prometheus is runing or not + */ + prometheusHealth: boolean | undefined; /** * The name of the currently running ray session. */ @@ -63,6 +67,7 @@ export const GlobalContext = React.createContext({ ipLogMap: {}, namespaceMap: {}, grafanaHost: undefined, + prometheusHealth: undefined, sessionName: undefined, }); @@ -79,6 +84,7 @@ const App = () => { ipLogMap: {}, namespaceMap: {}, grafanaHost: undefined, + prometheusHealth: undefined, sessionName: undefined, }); const getTheme = (name: string) => { @@ -119,11 +125,13 @@ const App = () => { // Detect if grafana is running useEffect(() => { const doEffect = async () => { - const { grafanaHost, sessionName } = await getMetricsInfo(); + const { grafanaHost, sessionName, prometheusHealth } = + await getMetricsInfo(); setContext((existingContext) => ({ ...existingContext, grafanaHost, sessionName, + prometheusHealth, })); }; doEffect(); @@ -221,6 +229,8 @@ const App = () => { /> + } path="actors" /> + } path="metrics" /> } path="logs"> {/* TODO(aguo): Refactor Logs component to use optional query params since react-router 6 doesn't support optional path params... */} diff --git a/dashboard/client/src/components/EventTable.tsx b/dashboard/client/src/components/EventTable.tsx index c4d9cfec7a17..174a94e9f5a9 100644 --- a/dashboard/client/src/components/EventTable.tsx +++ b/dashboard/client/src/components/EventTable.tsx @@ -35,11 +35,16 @@ const useStyles = makeStyles((theme) => ({ padding: theme.spacing(2), marginTop: theme.spacing(2), }, + filterContainer: { + display: "flex", + alignItems: "center", + }, search: { margin: theme.spacing(1), display: "inline-block", fontSize: 12, lineHeight: "46px", + height: 56, }, infokv: { margin: theme.spacing(1), @@ -166,7 +171,7 @@ const EventTable = (props: EventTableProps) => { return (
-
+
- + )} diff --git a/dashboard/client/src/components/PlacementGroupTable.tsx b/dashboard/client/src/components/PlacementGroupTable.tsx index f3768034b477..dd2ac7084e98 100644 --- a/dashboard/client/src/components/PlacementGroupTable.tsx +++ b/dashboard/client/src/components/PlacementGroupTable.tsx @@ -148,7 +148,7 @@ const PlacementGroupTable = ({ {name ? name : "-"} {creator_job_id} - + {stats ? stats.scheduling_state : "-"} diff --git a/dashboard/client/src/components/StatusChip.tsx b/dashboard/client/src/components/StatusChip.tsx index 7c57c0d724b1..c945c3a6cbd9 100644 --- a/dashboard/client/src/components/StatusChip.tsx +++ b/dashboard/client/src/components/StatusChip.tsx @@ -11,6 +11,8 @@ import { import { CSSProperties } from "@material-ui/core/styles/withStyles"; import React, { ReactNode } from "react"; import { ActorEnum } from "../type/actor"; +import { PlacementGroupState } from "../type/placementGroup"; +import { TypeTaskStatus } from "../type/task"; const colorMap = { node: { @@ -26,18 +28,37 @@ const colorMap = { [ActorEnum.PENDING]: blue, [ActorEnum.RECONSTRUCTING]: lightBlue, }, + task: { + [TypeTaskStatus.FAILED]: red, + [TypeTaskStatus.FINISHED]: green, + [TypeTaskStatus.RUNNING]: blue, + [TypeTaskStatus.RUNNING_IN_RAY_GET]: blue, + [TypeTaskStatus.RUNNING_IN_RAY_WAIT]: blue, + [TypeTaskStatus.SUBMITTED_TO_WORKER]: "#cfcf08", + [TypeTaskStatus.PENDING_ARGS_FETCH]: blue, + [TypeTaskStatus.PENDING_OBJ_STORE_MEM_AVAIL]: blue, + [TypeTaskStatus.PENDING_NODE_ASSIGNMENT]: "#cfcf08", + [TypeTaskStatus.PENDING_ARGS_AVAIL]: "#f79e02", + }, job: { INIT: grey, - SUBMITTED: blue, + SUBMITTED: "#cfcf08", DISPATCHED: lightBlue, - RUNNING: green, - COMPLETED: cyan, - FINISHED: cyan, + RUNNING: blue, + COMPLETED: green, + SUCCEEDED: green, + FINISHED: green, FAILED: red, }, + placementGroup: { + [PlacementGroupState.PENDING]: "#f79e02", + [PlacementGroupState.CREATED]: blue, + [PlacementGroupState.REMOVED]: red, + [PlacementGroupState.RESCHEDULING]: "#cfcf08", + }, } as { [key: string]: { - [key: string]: Color; + [key: string]: Color | string; }; }; @@ -66,7 +87,7 @@ export const StatusChip = ({ margin: 2, } as CSSProperties; - let color = blueGrey as Color; + let color: Color | string = blueGrey; if (typeMap[type]) { color = typeMap[type]; @@ -78,10 +99,12 @@ export const StatusChip = ({ color = colorMap[type][status]; } - style.color = color[500]; - style.borderColor = color[500]; + const colorValue = typeof color === "string" ? color : color[500]; + + style.color = colorValue; + style.borderColor = colorValue; if (color !== blueGrey) { - style.backgroundColor = `${color[500]}20`; + style.backgroundColor = `${colorValue}20`; } return ( diff --git a/dashboard/client/src/components/TaskTable.tsx b/dashboard/client/src/components/TaskTable.tsx index c833cb1a2ae0..c4f59ac3c66a 100644 --- a/dashboard/client/src/components/TaskTable.tsx +++ b/dashboard/client/src/components/TaskTable.tsx @@ -170,7 +170,7 @@ const TaskTable = ({ {name ? name : "-"} {job_id} - + {start_time_ms && start_time_ms > 0 ? 
( diff --git a/dashboard/client/src/pages/actor/index.tsx b/dashboard/client/src/pages/actor/index.tsx index 4cbe9c2afef3..7661539b518a 100644 --- a/dashboard/client/src/pages/actor/index.tsx +++ b/dashboard/client/src/pages/actor/index.tsx @@ -1,6 +1,7 @@ import { makeStyles } from "@material-ui/core"; import React from "react"; import TitleCard from "../../components/TitleCard"; +import { MainNavPageInfo } from "../layout/mainNavContext"; import ActorList from "./ActorList"; const useStyles = makeStyles((theme) => ({ @@ -18,6 +19,13 @@ const Actors = () => { return (
+ diff --git a/dashboard/client/src/pages/job/JobDetail.tsx b/dashboard/client/src/pages/job/JobDetail.tsx index 8f0b6cdf1c21..dbc408ff8f80 100644 --- a/dashboard/client/src/pages/job/JobDetail.tsx +++ b/dashboard/client/src/pages/job/JobDetail.tsx @@ -1,12 +1,15 @@ import { makeStyles } from "@material-ui/core"; import { Alert } from "@material-ui/lab"; import dayjs from "dayjs"; -import React from "react"; +import React, { useContext } from "react"; +import { Link } from "react-router-dom"; +import { GlobalContext } from "../../App"; import { DurationText } from "../../common/DurationText"; import Loading from "../../components/Loading"; import { MetadataSection } from "../../components/MetadataSection"; import { StatusChip } from "../../components/StatusChip"; import TitleCard from "../../components/TitleCard"; +import { UnifiedJob } from "../../type/job"; import ActorList from "../actor/ActorList"; import PlacementGroupList from "../state/PlacementGroup"; import TaskList from "../state/task"; @@ -163,6 +166,10 @@ export const JobDetailChartsPage = ({ : "-", }, }, + { + label: "Logs", + content: , + }, ]} /> @@ -177,3 +184,49 @@ export const JobDetailChartsPage = ({
); }; + +type JobLogsLinkProps = { + job: Pick< + UnifiedJob, + | "driver_agent_http_address" + | "driver_info" + | "job_id" + | "submission_id" + | "type" + >; + newIA?: boolean; +}; + +export const JobLogsLink = ({ + job: { driver_agent_http_address, driver_info, job_id, submission_id, type }, + newIA = false, +}: JobLogsLinkProps) => { + const { ipLogMap } = useContext(GlobalContext); + + let link: string | undefined; + + const baseLink = newIA ? "/new/logs" : "/log"; + + if (driver_agent_http_address) { + link = `${baseLink}/${encodeURIComponent( + `${driver_agent_http_address}/logs`, + )}`; + } else if (driver_info && ipLogMap[driver_info.node_ip_address]) { + link = `${baseLink}/${encodeURIComponent( + ipLogMap[driver_info.node_ip_address], + )}`; + } + + if (link) { + link += `?fileName=${ + type === "DRIVER" ? job_id : `driver-${submission_id}` + }`; + return ( + + Log + + ); + } + + return -; +}; diff --git a/dashboard/client/src/pages/job/JobRow.tsx b/dashboard/client/src/pages/job/JobRow.tsx index 0be459efa1df..010754eb4976 100644 --- a/dashboard/client/src/pages/job/JobRow.tsx +++ b/dashboard/client/src/pages/job/JobRow.tsx @@ -1,18 +1,20 @@ import { TableCell, TableRow, Tooltip } from "@material-ui/core"; import { makeStyles } from "@material-ui/core/styles"; import dayjs from "dayjs"; -import React, { useContext } from "react"; +import React from "react"; import { Link } from "react-router-dom"; -import { GlobalContext } from "../../App"; import { DurationText } from "../../common/DurationText"; +import { StatusChip } from "../../components/StatusChip"; import { UnifiedJob } from "../../type/job"; import { useJobProgress } from "./hook/useJobProgress"; +import { JobLogsLink } from "./JobDetail"; import { MiniTaskProgressBar } from "./TaskProgressBar"; const useStyles = makeStyles((theme) => ({ overflowCell: { display: "block", - width: "150px", + margin: "auto", + maxWidth: 360, textOverflow: "ellipsis", overflow: "hidden", whiteSpace: "nowrap", @@ -24,21 +26,16 @@ type JobRowProps = { newIA?: boolean; }; -export const JobRow = ({ - job: { +export const JobRow = ({ job, newIA = false }: JobRowProps) => { + const { job_id, submission_id, driver_info, - type, status, start_time, end_time, entrypoint, - driver_agent_http_address, - }, - newIA = false, -}: JobRowProps) => { - const { ipLogMap } = useContext(GlobalContext); + } = job; const { progress, error, driverExists } = useJobProgress(job_id ?? undefined); const classes = useStyles(); @@ -57,30 +54,6 @@ export const JobRow = ({ } })(); - const logsLink = (() => { - let link: string | undefined; - if (driver_agent_http_address) { - link = `/log/${encodeURIComponent(`${driver_agent_http_address}/logs`)}`; - } else if (driver_info && ipLogMap[driver_info.node_ip_address]) { - link = `/log/${encodeURIComponent( - ipLogMap[driver_info.node_ip_address], - )}`; - } - - if (link) { - link += `?fileName=${ - type === "DRIVER" ? job_id : `driver-${submission_id}` - }`; - return ( - - Log - - ); - } - - return "-"; - })(); - return ( @@ -101,7 +74,9 @@ export const JobRow = ({
{entrypoint}
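To keep the surrounding JobRow.tsx hunk readable: the inline logsLink IIFE that used to live in this row has moved into the exported JobLogsLink component defined in JobDetail.tsx above, which resolves the log URL from either driver_agent_http_address or the GlobalContext ipLogMap. A small usage sketch, assuming a full UnifiedJob object (which satisfies the component's Pick<...> prop); the wrapping cell markup is illustrative and not part of the patch:

    import React from "react";
    import { TableCell } from "@material-ui/core";
    import { UnifiedJob } from "../../type/job";
    import { JobLogsLink } from "./JobDetail";

    // Renders a "Log" link when a log location can be resolved, otherwise "-".
    const JobLogsCell = ({ job }: { job: UnifiedJob }) => (
      <TableCell align="center">
        <JobLogsLink job={job} newIA={false} />
      </TableCell>
    );

Passing newIA switches the link prefix between the old /log route and the /new/logs route used by the new information architecture.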
- {status} + + + {start_time && start_time > 0 ? ( @@ -113,7 +88,7 @@ export const JobRow = ({ {/* TODO(aguo): Also show logs for the job id instead of just the submission's logs */} - {logsLink} + {dayjs(Number(start_time)).format("YYYY/MM/DD HH:mm:ss")} diff --git a/dashboard/client/src/pages/layout/MainNavLayout.tsx b/dashboard/client/src/pages/layout/MainNavLayout.tsx index 85dabc6d97a3..fb2fcd6f968c 100644 --- a/dashboard/client/src/pages/layout/MainNavLayout.tsx +++ b/dashboard/client/src/pages/layout/MainNavLayout.tsx @@ -1,12 +1,19 @@ -import { createStyles, makeStyles, Typography } from "@material-ui/core"; +import { + createStyles, + IconButton, + makeStyles, + Tooltip, + Typography, +} from "@material-ui/core"; import classNames from "classnames"; import React, { useContext } from "react"; +import { RiBookMarkLine, RiFeedbackLine } from "react-icons/ri/"; import { Link, Outlet } from "react-router-dom"; import Logo from "../../logo.svg"; import { MainNavContext, useMainNavState } from "./mainNavContext"; -const MAIN_NAV_HEIGHT = 56; -const BREADCRUMBS_HEIGHT = 36; +export const MAIN_NAV_HEIGHT = 56; +export const BREADCRUMBS_HEIGHT = 36; const useStyles = makeStyles((theme) => createStyles({ @@ -103,6 +110,23 @@ const useMainNavBarStyles = makeStyles((theme) => navItemHighlighted: { color: "#036DCF", }, + flexSpacer: { + flexGrow: 1, + }, + actionItemsContainer: { + marginRight: theme.spacing(2), + }, + backToOld: { + marginRight: theme.spacing(1.5), + textDecoration: "none", + }, + backToOldText: { + letterSpacing: 0.25, + fontWeight: 500, + }, + actionItem: { + color: "#5F6469", + }, }), ); @@ -122,6 +146,16 @@ const NAV_ITEMS = [ path: "/new/cluster", id: "cluster", }, + { + title: "Actors", + path: "/new/actors", + id: "actors", + }, + { + title: "Metrics", + path: "/new/metrics", + id: "metrics", + }, { title: "Logs", path: "/new/logs", @@ -152,6 +186,41 @@ const MainNavBar = () => { ))} +
+
+ + + Back to old UI + + + + + + + + + + + + +
); }; diff --git a/dashboard/client/src/pages/layout/index.tsx b/dashboard/client/src/pages/layout/index.tsx index ee11cd765377..cdc6e07a3c76 100644 --- a/dashboard/client/src/pages/layout/index.tsx +++ b/dashboard/client/src/pages/layout/index.tsx @@ -61,6 +61,14 @@ const useStyles = makeStyles((theme) => ({ child: { flex: 1, }, + newUI: { + fontWeight: 500, + color: "#036DCF", + backgroundColor: "#036DCF20", + padding: theme.spacing(0.5), + margin: theme.spacing(-0.5), + borderRadius: 4, + }, })); const BasicLayout = ({ @@ -151,6 +159,15 @@ const BasicLayout = ({ METRICS )} + navigate("/new")} + > + + TRY THE NEW UI + + ) => { + return ( + + {children} + + ); +}; + +const MetricsDisabledWrapper = ({ children }: PropsWithChildren<{}>) => { + return ( + + {children} + + ); +}; + +describe("Metrics", () => { + it("renders", async () => { + expect.assertions(6); + + render(, { wrapper: Wrapper }); + await screen.findByText(/View in Grafana/); + expect(screen.getByText(/30 minutes/)).toBeVisible(); + expect(screen.getByText(/Tasks/)).toBeVisible(); + expect(screen.getByText(/Actors/)).toBeVisible(); + expect(screen.getByText(/Scheduler and autoscaler/)).toBeVisible(); + expect(screen.getByText(/Node metrics/)).toBeVisible(); + expect( + screen.queryByText(/Grafana or prometheus server not detected./), + ).toBeNull(); + }); + + it("renders warning when ", async () => { + expect.assertions(6); + + render(, { wrapper: MetricsDisabledWrapper }); + await screen.findByText(/Grafana or prometheus server not detected./); + expect(screen.queryByText(/View in Grafana/)).toBeNull(); + expect(screen.queryByText(/30 minutes/)).toBeNull(); + expect(screen.queryByText(/Tasks/)).toBeNull(); + expect(screen.queryByText(/Actors/)).toBeNull(); + expect(screen.queryByText(/Scheduler and autoscaler/)).toBeNull(); + expect(screen.queryByText(/Node metrics/)).toBeNull(); + }); +}); diff --git a/dashboard/client/src/pages/metrics/Metrics.tsx b/dashboard/client/src/pages/metrics/Metrics.tsx index 8610f6961622..db51011e4fb6 100644 --- a/dashboard/client/src/pages/metrics/Metrics.tsx +++ b/dashboard/client/src/pages/metrics/Metrics.tsx @@ -7,29 +7,36 @@ import { TextField, } from "@material-ui/core"; import { Alert } from "@material-ui/lab"; +import classNames from "classnames"; import React, { useContext, useEffect, useState } from "react"; +import { RiExternalLinkLine } from "react-icons/ri"; import { GlobalContext } from "../../App"; +import { CollapsibleSection } from "../../common/CollapsibleSection"; +import { ClassNameProps } from "../../common/props"; +import { MainNavPageInfo } from "../layout/mainNavContext"; +import { MAIN_NAV_HEIGHT } from "../layout/MainNavLayout"; const useStyles = makeStyles((theme) => createStyles({ - root: {}, + metricsRoot: { margin: theme.spacing(1) }, + metricsSection: { + marginTop: theme.spacing(3), + }, grafanaEmbedsContainer: { - marginTop: theme.spacing(1), - marginLeft: theme.spacing(1), display: "flex", flexDirection: "row", flexWrap: "wrap", gap: theme.spacing(3), + marginTop: theme.spacing(2), }, chart: { - flex: "1 0 448px", - maxWidth: "100%", + width: "100%", height: 300, overflow: "hidden", [theme.breakpoints.up("md")]: { // Calculate max width based on 1/3 of the total width minus padding between cards - maxWidth: `calc((100% - ${theme.spacing(3)}px * 2) / 3)`, + width: `calc((100% - ${theme.spacing(3)}px * 2) / 3)`, }, }, grafanaEmbed: { @@ -38,16 +45,26 @@ const useStyles = makeStyles((theme) => }, topBar: { position: "sticky", + top: 0, width: "100%", display: 
"flex", flexDirection: "row", alignItems: "center", justifyContent: "flex-end", padding: theme.spacing(1), + boxShadow: "0px 1px 0px #D2DCE6", + zIndex: 1, + height: 36, + }, + topBarNewIA: { + top: MAIN_NAV_HEIGHT, }, timeRangeButton: { marginLeft: theme.spacing(2), }, + alert: { + marginTop: 30, + }, }), ); @@ -75,85 +92,121 @@ const TIME_RANGE_TO_FROM_VALUE: Record = { [TimeRangeOptions.SEVEN_DAYS]: "now-7d", }; +type MetricConfig = { + title: string; + path: string; +}; + +type MetricsSectionConfig = { + title: string; + contents: MetricConfig[]; +}; + // NOTE: please keep the titles here in sync with grafana_dashboard_factory.py -const METRICS_CONFIG = [ - { - title: "Scheduler Task State", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=26", - }, - { - title: "Active Tasks by Name", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=35", - }, - { - title: "Scheduler Actor State", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=33", - }, - { - title: "Active Actors by Name", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=36", - }, +const METRICS_CONFIG: MetricsSectionConfig[] = [ { - title: "Scheduler CPUs (logical slots)", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=27", - }, - { - title: "Object Store Memory", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=29", - }, - { - title: "Scheduler GPUs (logical slots)", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=28", - }, - { - title: "Scheduler Placement Groups", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=40", - }, - { - title: "Node CPU (hardware utilization)", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=2", - }, - { - title: "Node GPU (hardware utilization)", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=8", - }, - { - title: "Node Disk", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=6", - }, - { - title: "Node Disk IO Speed", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=32", - }, - { - title: "Node Memory (heap + object store)", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=4", - }, - { - title: "Node Memory by Component", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=34", - }, - { - title: "Node CPU by Component", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=37", + title: "Tasks", + contents: [ + { + title: "Scheduler Task State", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=26", + }, + { + title: "Active Tasks by Name", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=35", + }, + ], }, { - title: "Node GPU Memory (GRAM)", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=18", + title: "Actors", + contents: [ + { + title: "Scheduler Actor State", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=33", + }, + { + title: "Active Actors by Name", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=36", + }, + ], }, { - title: "Node Network", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=20", 
+ title: "Scheduler and autoscaler", + contents: [ + { + title: "Node Count", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=24", + }, + { + title: "Scheduler CPUs (logical slots)", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=27", + }, + { + title: "Scheduler GPUs (logical slots)", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=28", + }, + { + title: "Scheduler Placement Groups", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=40", + }, + ], }, { - title: "Node Count", - path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=24", + title: "Node metrics", + contents: [ + { + title: "Node CPU (hardware utilization)", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=2", + }, + { + title: "Node Memory (heap + object store)", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=4", + }, + { + title: "Node GPU (hardware utilization)", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=8", + }, + { + title: "Node GPU Memory (GRAM)", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=18", + }, + { + title: "Node Disk", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=6", + }, + { + title: "Node Disk IO Speed", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=32", + }, + { + title: "Node Network", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=20", + }, + { + title: "Node CPU by Component", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=37", + }, + + { + title: "Node Memory by Component", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=34", + }, + { + title: "Object Store Memory", + path: "/d-solo/rayDefaultDashboard/default-dashboard?orgId=1&theme=light&panelId=29", + }, + ], }, ]; -export const Metrics = () => { +type MetricsProps = { + newIA?: boolean; +}; + +export const Metrics = ({ newIA = false }: MetricsProps) => { const classes = useStyles(); - const { grafanaHost, sessionName } = useContext(GlobalContext); + const { grafanaHost, sessionName, prometheusHealth } = + useContext(GlobalContext); const [timeRangeOption, setTimeRangeOption] = useState( TimeRangeOptions.THIRTY_MINS, @@ -172,31 +225,28 @@ export const Metrics = () => { const timeRangeParams = `${fromParam}${toParam}`; return ( -
- {grafanaHost === undefined ? ( - - Grafana server not detected. Please make sure the grafana server is - running and refresh this page. See:{" "} - - https://docs.ray.io/en/latest/ray-observability/ray-metrics.html - - . -
- If you are hosting grafana on a separate machine or using a - non-default port, please set the RAY_GRAFANA_HOST env var to point to - your grafana server when launching ray. -
+
+ + {grafanaHost === undefined || !prometheusHealth ? ( + ) : (
- + @@ -204,7 +254,6 @@ export const Metrics = () => { className={classes.timeRangeButton} select size="small" - variant="outlined" style={{ width: 120 }} value={timeRangeOption} onChange={({ target: { value } }) => { @@ -223,17 +272,34 @@ export const Metrics = () => { time-series graph. You can use control/cmd + click to filter out a line in the time-series graph. -
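One more reading aid for the Metrics.tsx rewrite: METRICS_CONFIG is no longer a flat list of charts but a list of titled sections ("Tasks", "Actors", "Scheduler and autoscaler", "Node metrics"), and the page is expected to iterate section by section (the patch imports CollapsibleSection for this, though that part of the render is not fully visible in this hunk). A rough, self-contained sketch of walking the new shape, under the assumption that a section component only needs a title and children; MetricsSections and renderChart are illustrative names, not code from the patch:

    import React from "react";

    // Shapes copied from the diff above.
    type MetricConfig = { title: string; path: string };
    type MetricsSectionConfig = { title: string; contents: MetricConfig[] };

    // Hypothetical renderer: one titled block per section, one chart per entry.
    const MetricsSections = ({
      sections,
      renderChart,
    }: {
      sections: MetricsSectionConfig[];
      renderChart: (metric: MetricConfig) => React.ReactNode;
    }) => (
      <>
        {sections.map(({ title, contents }) => (
          <section key={title}>
            <h3>{title}</h3>
            {contents.map((metric) => (
              <React.Fragment key={metric.title}>
                {renderChart(metric)}
              </React.Fragment>
            ))}
          </section>
        ))}
      </>
    );

Keeping the chart definitions as data (a title plus a Grafana panel path) preserves the property the old flat list had: new panels can be added by editing METRICS_CONFIG alone, without touching the rendering code.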
- {METRICS_CONFIG.map(({ title, path }) => ( - -