@@ -47,7 +47,7 @@ static fs::path getTransferOutputPath(char const* tag)
47
47
return {};
48
48
}
49
49
50
- DataSenderImpl::DataSenderImpl (executor::kv_cache::ConnectionManager* manager,
50
+ CacheSenderImpl::CacheSenderImpl (executor::kv_cache::ConnectionManager* manager,
51
51
executor::kv_cache::CacheState selfCacheState, SizeType32 selfIndex, std::unique_ptr<BaseCacheFormatter> formatter)
52
52
: mManager {manager}
53
53
, mSelfState {std::move (selfCacheState), executor::kv_cache::CommState{manager->getCommState ()}}
@@ -58,7 +58,7 @@ DataSenderImpl::DataSenderImpl(executor::kv_cache::ConnectionManager* manager,
58
58
TLLM_CHECK (mManager ->getCommState ().getSelfIdx () == selfIndex);
59
59
}
60
60
61
- [[nodiscard]] RequestInfo DataSenderImpl ::recvRequestInfo ()
61
+ [[nodiscard]] RequestInfo CacheSenderImpl ::recvRequestInfo ()
62
62
{
63
63
using DataContext = tensorrt_llm::executor::kv_cache::DataContext;
64
64
auto * agentConnectionManager = dynamic_cast <executor::kv_cache::AgentConnectionManager*>(mManager );
@@ -111,7 +111,7 @@ DataSenderImpl::DataSenderImpl(executor::kv_cache::ConnectionManager* manager,
111
111
return info;
112
112
}
113
113
114
- void DataSenderImpl ::sendSync (LlmRequest const & llmRequest)
114
+ void CacheSenderImpl ::sendSync (LlmRequest const & llmRequest)
115
115
{
116
116
auto it = mRequestToSession .find (llmRequest.mRequestId );
117
117
TLLM_CHECK (it != mRequestToSession .end ());
@@ -120,24 +120,24 @@ void DataSenderImpl::sendSync(LlmRequest const& llmRequest)
120
120
mFormatter ->format (session);
121
121
}
122
122
123
- [[nodiscard]] executor::kv_cache::CommState const & DataSenderImpl ::getCommState () const
123
+ [[nodiscard]] executor::kv_cache::CommState const & CacheSenderImpl ::getCommState () const
124
124
{
125
125
return mSelfState .getCommState ().value ();
126
126
}
127
127
128
- void DataSenderImpl ::setCommState (executor::kv_cache::CommState commState)
128
+ void CacheSenderImpl ::setCommState (executor::kv_cache::CommState commState)
129
129
{
130
130
mSelfState .setCommState (std::move (commState));
131
131
}
132
132
133
- [[nodiscard]] size_t DataSenderImpl ::getCounterpartsCount (LlmRequest::RequestIdType requestId) const
133
+ [[nodiscard]] size_t CacheSenderImpl ::getCounterpartsCount (LlmRequest::RequestIdType requestId) const
134
134
{
135
135
auto it = mRequestToSession .find (requestId);
136
136
TLLM_CHECK (it != mRequestToSession .end ());
137
137
return it->second .getConnections ().size ();
138
138
}
139
139
140
- void DataSenderImpl ::release (LlmRequest::RequestIdType requestId)
140
+ void CacheSenderImpl ::release (LlmRequest::RequestIdType requestId)
141
141
{
142
142
auto it = mRequestToSession .find (requestId);
143
143
TLLM_CHECK (it != mRequestToSession .end ());
@@ -156,7 +156,7 @@ void DataSenderImpl::release(LlmRequest::RequestIdType requestId)
156
156
mRequestToSession .erase (it);
157
157
}
158
158
159
- DataReceiverImpl::DataReceiverImpl (executor::kv_cache::ConnectionManager* manager,
159
+ CacheReceiverImpl::CacheReceiverImpl (executor::kv_cache::ConnectionManager* manager,
160
160
executor::kv_cache::CacheState selfCacheState, SizeType32 selfIndex, std::unique_ptr<BaseCacheFormatter> formatter)
161
161
: mManager {manager}
162
162
, mSelfState {std::move (selfCacheState), executor::kv_cache::CommState{manager->getCommState ()}}
@@ -167,7 +167,7 @@ DataReceiverImpl::DataReceiverImpl(executor::kv_cache::ConnectionManager* manage
167
167
TLLM_CHECK (mFormatter );
168
168
}
169
169
170
- TransferSession DataReceiverImpl ::sendRequestInfo (LlmRequest const & llmRequest)
170
+ TransferSession CacheReceiverImpl ::sendRequestInfo (LlmRequest const & llmRequest)
171
171
{
172
172
uint64_t requestId = llmRequest.getContextPhaseParams ().value ().getReqId ();
173
173
auto const & contextState = llmRequest.getDataTransceiverState ();
@@ -233,7 +233,7 @@ TransferSession DataReceiverImpl::sendRequestInfo(LlmRequest const& llmRequest)
233
233
contextState, resource->mBufferManager , &llmRequest, !common::getEnvKVCacheTransferOutputPath ().empty ());
234
234
}
235
235
236
- void DataReceiverImpl ::receiveSync (TransferSession& session)
236
+ void CacheReceiverImpl ::receiveSync (TransferSession& session)
237
237
{
238
238
mFormatter ->unformat (session);
239
239
if (!common::getEnvKVCacheTransferOutputPath ().empty ())
@@ -250,7 +250,7 @@ void DataReceiverImpl::receiveSync(TransferSession& session)
250
250
}
251
251
}
252
252
253
- void DataReceiverImpl ::sendRequestInfo (executor::kv_cache::Connection const * connection, RequestInfo const & info)
253
+ void CacheReceiverImpl ::sendRequestInfo (executor::kv_cache::Connection const * connection, RequestInfo const & info)
254
254
{
255
255
std::ostringstream oss;
256
256
RequestInfo::serialize (info, oss);
@@ -262,7 +262,7 @@ void DataReceiverImpl::sendRequestInfo(executor::kv_cache::Connection const* con
262
262
connection->send (executor::kv_cache::DataContext{kINFO_TAG }, serializedInfo.data (), infoSize);
263
263
}
264
264
265
- std::unique_ptr<DataReceiverImpl ::ReceiveCacheResource> const & DataReceiverImpl ::getReceiveCacheResource (
265
+ std::unique_ptr<CacheReceiverImpl ::ReceiveCacheResource> const & CacheReceiverImpl ::getReceiveCacheResource (
266
266
LlmRequest const & llmRequest)
267
267
{
268
268
std::scoped_lock<std::mutex> lock (mProcessIoResouceMutex );
0 commit comments