Merged
467 changes: 281 additions & 186 deletions data_store_service_client.cpp

Large diffs are not rendered by default.

152 changes: 106 additions & 46 deletions data_store_service_client.h
@@ -55,6 +55,8 @@ class ScanNextClosure;
class CreateSnapshotForBackupClosure;
class SinglePartitionScanner;

class DssClusterConfig;

typedef void (*DataStoreCallback)(void *data,
::google::protobuf::Closure *closure,
DataStoreServiceClient &client,
@@ -69,16 +71,27 @@ class DataStoreServiceClient : public txservice::store::DataStoreHandler
txservice::CatalogFactory *catalog_factory[3],
const DataStoreServiceClusterManager &cluster_manager,
DataStoreService *data_store_service = nullptr)
: ds_serv_shutdown_indicator_(false),
catalog_factory_array_{catalog_factory[0],
: catalog_factory_array_{catalog_factory[0],
catalog_factory[1],
catalog_factory[2],
&range_catalog_factory_,
&hash_catalog_factory_},
cluster_manager_(cluster_manager),
data_store_service_(data_store_service),
flying_remote_fetch_count_(0)
data_store_service_(data_store_service)
{
// Init dss cluster config.
dss_topology_version_ = cluster_manager.GetTopologyVersion();
auto all_shards = cluster_manager.GetAllShards();
assert(all_shards.size() == 1);
for (auto &[shard_id, shard] : all_shards)
{
uint32_t node_idx = FindFreeNodeIndex();
auto &node_ref = dss_nodes_[node_idx];
node_ref.Reset(shard.nodes_[0].host_name_,
shard.nodes_[0].port_,
shard.version_);
dss_shards_[shard_id].store(shard_id);
}

Comment on lines +82 to +94
Contributor

⚠️ Potential issue | 🔴 Critical

Fix out-of-bounds access on dss_shards_.

dss_shards_ now has size 1, but we still subscript it with shard_id. Any non-zero shard id (perfectly valid even in a single-shard deployment) will index past the end and corrupt memory. Please store the owner slot at index 0 (and assert shard.shard_id_ == 0 if that’s the intended invariant), or switch back to a container keyed by the actual shard id. Keeping the current code is undefined behaviour.

🤖 Prompt for AI Agents
data_store_service_client.h around lines 82-94: the code subscripts dss_shards_
with shard_id while dss_shards_ has fixed size 1, causing out-of-bounds access
for non-zero shard ids. Fix by either (A) if the design guarantees a single
shard, assert that the shard's id is 0 and store the owner into dss_shards_[0]
instead of dss_shards_[shard_id]; or (B) if multiple shard ids must be
supported, replace dss_shards_ with a container keyed by shard_id (e.g., a map
or vector sized to max shard id) and insert/store using the actual shard_id.
Implement one of these two fixes and add an assertion or bounds-check to prevent
future UB.

Comment on lines +74 to +94

⚠️ Potential issue | 🔴 Critical

Fix OOB and wrong value stored in dss_shards_; remember actual shard id

dss_shards_ has size 1, but you subscript it with shard_id and store shard_id rather than the node index. That is undefined behaviour, and the mapping is wrong whenever the lone shard's id is non-zero.

Apply this diff to the ctor body:

-        for (auto &[shard_id, shard] : all_shards)
+        for (auto &[shard_id, shard] : all_shards)
         {
             uint32_t node_idx = FindFreeNodeIndex();
             auto &node_ref = dss_nodes_[node_idx];
             node_ref.Reset(shard.nodes_[0].host_name_,
                            shard.nodes_[0].port_,
                            shard.version_);
-            dss_shards_[shard_id].store(shard_id);
+            // Remember the only shard id, and store owner node index at slot 0
+            single_shard_id_ = shard_id;
+            dss_shards_[0].store(node_idx, std::memory_order_release);
         }

Declare a field to hold the actual shard id (outside this hunk, in the private section):

uint32_t single_shard_id_{0};

Follow-up: update client.cpp call sites to (a) assert the passed shard_id equals single_shard_id_, and (b) read/write dss_shards_[0]. See suggested diffs in client.cpp comments.

🤖 Prompt for AI Agents
In data_store_service_client.h around lines 74-94, the ctor indexes dss_shards_
with the actual shard_id (which can be nonzero) causing OOB and stores the
shard_id instead of recording the actual shard id; declare a new private field
uint32_t single_shard_id_ and in this ctor set single_shard_id_ = shard_id for
the lone shard, then always read/write dss_shards_[0] (not
dss_shards_[shard_id]) and store the node index/slot or relevant node data
there; additionally update client.cpp call sites to assert that any passed
shard_id equals single_shard_id_ and change accesses to use dss_shards_[0] for
reads/writes.

if (data_store_service_ != nullptr)
{
data_store_service_->AddListenerForUpdateConfig(
@@ -359,24 +372,6 @@ class DataStoreServiceClient : public txservice::store::DataStoreHandler

void OnShutdown() override;

void HandleShardingError(const ::EloqDS::remote::CommonResult &result)
{
cluster_manager_.HandleShardingError(result);
}

std::shared_ptr<brpc::Channel> GetDataStoreServiceChannelByPartitionId(
uint32_t partition_id);
std::shared_ptr<brpc::Channel> UpdateDataStoreServiceChannelByPartitionId(
uint32_t partition_id);
std::shared_ptr<brpc::Channel> GetDataStoreServiceChannelByShardId(
uint32_t shard_id);
std::shared_ptr<brpc::Channel> UpdateDataStoreServiceChannelByShardId(
uint32_t shard_id);
std::shared_ptr<brpc::Channel> GetDataStoreServiceChannel(
const DSSNode &node);
std::shared_ptr<brpc::Channel> UpdateDataStoreServiceChannel(
const DSSNode &node);

/**
* Serialize a record with is_deleted flag and record string.
* @param is_deleted
@@ -616,50 +611,115 @@ class DataStoreServiceClient : public txservice::store::DataStoreHandler
#endif
}

const txservice::CatalogFactory *GetCatalogFactory(
txservice::TableEngine table_engine)
{
return catalog_factory_array_.at(static_cast<int>(table_engine) - 1);
}

/**
* @brief Check if the shard_id is local to the current node.
* @param shard_id
* @return true if the shard_id is local to the current node.
*/
bool IsLocalShard(uint32_t shard_id);

uint32_t GetShardIdByPartitionId(int32_t partition_id)
{
return cluster_manager_.GetShardIdByPartitionId(partition_id);
}

const txservice::CatalogFactory *GetCatalogFactory(
txservice::TableEngine table_engine)
{
return catalog_factory_array_.at(static_cast<int>(table_engine) - 1);
}

/**
* @brief Check if the partition_id is local to the current node.
* @param partition_id
* @return true if the partition_id is local to the current node.
*/
bool IsLocalPartition(int32_t partition_id);

bthread::Mutex ds_service_mutex_;
bthread::ConditionVariable ds_service_cv_;
std::atomic<bool> ds_serv_shutdown_indicator_;
uint32_t GetShardIdByPartitionId(int32_t partition_id) const;
uint32_t AllDataShardCount() const;
uint32_t GetOwnerNodeIndexOfShard(uint32_t shard_id) const;
bool UpdateOwnerNodeIndexOfShard(uint32_t shard_id,
uint32_t old_node_index,
uint32_t &new_node_index);
uint32_t FindFreeNodeIndex();
void HandleShardingError(const ::EloqDS::remote::CommonResult &result);
bool UpgradeShardVersion(uint32_t shard_id,
uint64_t shard_version,
const std::string &host_name,
uint16_t port);

txservice::EloqHashCatalogFactory hash_catalog_factory_{};
txservice::EloqRangeCatalogFactory range_catalog_factory_{};
// TODO(lzx): define a global catalog factory array that used by
// EngineServer TxService and DataStoreHandler
std::array<const txservice::CatalogFactory *, 5> catalog_factory_array_;

// remote data store service configuration
DataStoreServiceClusterManager cluster_manager_;

// bthread::Mutex ds_service_mutex_;
// bthread::ConditionVariable ds_service_cv_;
// std::atomic<bool> ds_serv_shutdown_indicator_;
// point to the data store service if it is colocated
DataStoreService *data_store_service_;

std::atomic<uint64_t> flying_remote_fetch_count_{0};
// Work queue for fetch records from primary node
std::deque<txservice::FetchRecordCc *> remote_fetch_cc_queue_;
struct DssNode
{
DssNode() = default;
~DssNode() = default;
DssNode(const DssNode &rhs)
: host_name_(rhs.host_name_),
port_(rhs.port_),
shard_verion_(rhs.shard_verion_)
{
}
DssNode &operator=(const DssNode &) = delete;

void Reset(const std::string hostname,
uint16_t port,
uint64_t shard_version)
{
assert(expired_ts_.load(std::memory_order_acquire) == 0);
host_name_ = hostname;
port_ = port;
shard_verion_ = shard_version;
channel_.Init(host_name_.c_str(), port_, nullptr);
}

const std::string &HostName() const
{
return host_name_;
}
uint16_t Port() const
{
return port_;
}
uint64_t ShardVersion() const
{
return shard_verion_;
}
brpc::Channel *Channel()
{
assert(!host_name_.empty() && port_ != 0);
return &channel_;
}

// expired_ts_ is the timestamp when the node is expired.
// If expired_ts_ is 0, the node is not expired.
// If expired_ts_ is not 0, the node is expired and the value is the
// timestamp when the node is expired.
std::atomic<uint64_t> expired_ts_{1U};

private:
std::string host_name_;
uint16_t port_;
brpc::Channel channel_;
uint64_t shard_verion_;
};
// Cached leader nodes info of data shard.
std::array<DssNode, 1024> dss_nodes_;
const uint64_t NodeExpiredTime = 10 * 1000 * 1000; // 10s
// Now only support one shard. dss_shards_ caches the index in dss_nodes_ of
// shard owner.
std::array<std::atomic<uint32_t>, 1> dss_shards_;
std::atomic<uint64_t> dss_topology_version_{0};

Comment on lines +713 to +719

🛠️ Refactor suggestion | 🟠 Major

Single-shard modeling: clarify and constrain API

With std::array<std::atomic<uint32_t>, 1> dss_shards_, all getters/setters should use index 0 and validate shard_id == single_shard_id_. Current API suggests arbitrary shard ids and leads to UB elsewhere.

If multi-shard isn't supported yet:

  • Add asserts in getters/setters that shard_id == single_shard_id_.
  • Route all reads/writes to dss_shards_[0].
  • Expose single_shard_id_ to build correct shard_id vectors (don’t synthesize 0..N-1). See client.cpp diffs.

// std::atomic<uint64_t> flying_remote_fetch_count_{0};
// // Work queue for fetch records from primary node
// std::deque<txservice::FetchRecordCc *> remote_fetch_cc_queue_;

// table names and their kv table names
std::unordered_map<txservice::TableName, std::string>
@@ -674,9 +734,9 @@ class DataStoreServiceClient : public txservice::store::DataStoreHandler
friend class ScanNextClosure;
friend class CreateSnapshotForBackupClosure;
friend void PartitionBatchCallback(void *data,
::google::protobuf::Closure *closure,
DataStoreServiceClient &client,
const remote::CommonResult &result);
::google::protobuf::Closure *closure,
DataStoreServiceClient &client,
const remote::CommonResult &result);
friend class SinglePartitionScanner;
friend void FetchAllDatabaseCallback(void *data,
::google::protobuf::Closure *closure,