This commit is contained in:
Rongwei Zhang 2026-01-13 11:41:59 +00:00 committed by GitHub
commit e5a5720d3d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -2868,6 +2868,18 @@ void KVCacheManager::removeToken(RequestIdType requestId)
void KVCacheManager::rewindKVCache(RequestIdType requestId, SizeType32 rewindLengths)
{
// Check if the sequence still exists before rewinding
// In overlap mode with MTP, the request may have been terminated and removed
// from mSequences before rewindKVCache is called
{
std::scoped_lock lck(mSequencesMtx);
if (mSequences.find(requestId) == mSequences.end())
{
TLLM_LOG_DEBUG("Request %lu has already been removed from KV cache manager, skipping rewind", requestId);
return;
}
}
for (SizeType32 si = 0; si < rewindLengths; ++si)
{
removeToken(requestId);