fix(embeddings): truncate query content for temp doc query (#12573)

* fix(embeddings): truncate query content for temp doc query

* fix: use tokenService
This commit is contained in:
SuYao 2026-01-23 20:34:54 +08:00 committed by GitHub
parent 46fa59a10c
commit 022e1aee4a
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -30,6 +30,7 @@ import { isEmpty } from 'lodash'
import { getProviderByModel } from './AssistantService'
import FileManager from './FileManager'
import type { BlockManager } from './messageStreaming'
import { estimateTextTokens } from './TokenService'
const logger = loggerService.withContext('RendererKnowledgeService')
@ -146,6 +147,16 @@ export const searchKnowledgeBase = async (
parentSpanId?: string,
modelName?: string
): Promise<Array<KnowledgeSearchResult & { file: FileMetadata | null }>> => {
// Truncate query based on embedding model's max_context to prevent embedding errors
const maxContext = getEmbeddingMaxContext(base.model.id)
if (maxContext) {
const estimatedTokens = estimateTextTokens(query)
if (estimatedTokens > maxContext) {
const ratio = maxContext / estimatedTokens
query = query.slice(0, Math.floor(query.length * ratio))
}
}
let currentSpan: Span | undefined = undefined
try {
const baseParams = getKnowledgeBaseParams(base)