@@ -1465,16 +1465,19 @@ class CacheTransceiverConfig
14651465 NIXL = 3
14661466 };
14671467 explicit CacheTransceiverConfig (std::optional<BackendType> backendType = std::nullopt ,
1468- std::optional<size_t > maxNumTokens = std::nullopt , std::optional<int > kvTransferTimeoutMs = std::nullopt );
1468+ std::optional<size_t > maxNumTokens = std::nullopt , std::optional<int > kvTransferTimeoutMs = std::nullopt ,
1469+ std::optional<int > kvTransferSenderFutureTimeoutMs = std::nullopt );
14691470
14701471 bool operator ==(CacheTransceiverConfig const & other) const ;
14711472 void setBackendType (std::optional<BackendType> backendType);
14721473 void setMaxTokensInBuffer (std::optional<size_t > maxTokensInBuffer);
14731474 void setKvTransferTimeoutMs (std::optional<int > kvTransferTimeoutMs);
1475+ void setKvTransferSenderFutureTimeoutMs (std::optional<int > kvTransferSenderFutureTimeoutMs);
14741476
1475- [[nodiscard]] std::optional<int > getKvTransferTimeoutMs () const ;
14761477 [[nodiscard]] std::optional<size_t > getMaxTokensInBuffer () const ;
14771478 [[nodiscard]] std::optional<BackendType> getBackendType () const ;
1479+ [[nodiscard]] std::optional<int > getKvTransferTimeoutMs () const ;
1480+ [[nodiscard]] std::optional<int > getKvTransferSenderFutureTimeoutMs () const ;
14781481
14791482private:
14801483 std::optional<BackendType> mBackendType ;
@@ -1483,6 +1486,9 @@ class CacheTransceiverConfig
14831486 // / transfer may be degraded.
14841487 std::optional<size_t > mMaxTokensInBuffer ;
14851488 std::optional<int > mKvTransferTimeoutMs ;
1489+ /// @brief Timeout in milliseconds to wait for the sender future to be ready when the scheduled batch size is 0. This
1490+ /// allows the request to be eventually cancelled by the user or because of kv_transfer_timeout_ms.
1491+ std::optional<int > mKvTransferSenderFutureTimeoutMs ;
14861492};
14871493
14881494// / @brief Configuration class for the model executor
0 commit comments