mirror of
https://github.com/langgenius/dify.git
synced 2026-01-14 06:07:33 +08:00
Signed-off-by: -LAN- <laipz8200@outlook.com> Signed-off-by: kenwoodjw <blackxin55+@gmail.com> Signed-off-by: Yongtao Huang <yongtaoh2022@gmail.com> Signed-off-by: yihong0618 <zouzou0208@gmail.com> Signed-off-by: zhanluxianshen <zhanluxianshen@163.com> Co-authored-by: -LAN- <laipz8200@outlook.com> Co-authored-by: GuanMu <ballmanjq@gmail.com> Co-authored-by: Davide Delbianco <davide.delbianco@outlook.com> Co-authored-by: NeatGuyCoding <15627489+NeatGuyCoding@users.noreply.github.com> Co-authored-by: kenwoodjw <blackxin55+@gmail.com> Co-authored-by: Yongtao Huang <yongtaoh2022@gmail.com> Co-authored-by: Yongtao Huang <99629139+hyongtao-db@users.noreply.github.com> Co-authored-by: Qiang Lee <18018968632@163.com> Co-authored-by: 李强04 <liqiang04@gaotu.cn> Co-authored-by: autofix-ci[bot] <114827586+autofix-ci[bot]@users.noreply.github.com> Co-authored-by: Asuka Minato <i@asukaminato.eu.org> Co-authored-by: Matri Qi <matrixdom@126.com> Co-authored-by: huayaoyue6 <huayaoyue@163.com> Co-authored-by: Bowen Liang <liangbowen@gf.com.cn> Co-authored-by: znn <jubinkumarsoni@gmail.com> Co-authored-by: crazywoola <427733928@qq.com> Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com> Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com> Co-authored-by: yihong <zouzou0208@gmail.com> Co-authored-by: Muke Wang <shaodwaaron@gmail.com> Co-authored-by: wangmuke <wangmuke@kingsware.cn> Co-authored-by: Wu Tianwei <30284043+WTW0313@users.noreply.github.com> Co-authored-by: quicksand <quicksandzn@gmail.com> Co-authored-by: 非法操作 <hjlarry@163.com> Co-authored-by: zxhlyh <jasonapring2015@outlook.com> Co-authored-by: Eric Guo <eric.guocz@gmail.com> Co-authored-by: Zhedong Cen <cenzhedong2@126.com> Co-authored-by: jiangbo721 <jiangbo721@163.com> Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: hjlarry <25834719+hjlarry@users.noreply.github.com> Co-authored-by: lxsummer <35754229+lxjustdoit@users.noreply.github.com> Co-authored-by: 湛露先生 <zhanluxianshen@163.com> Co-authored-by: Guangdong Liu <liugddx@gmail.com> Co-authored-by: QuantumGhost <obelisk.reg+git@gmail.com> Co-authored-by: Claude <noreply@anthropic.com> Co-authored-by: Yessenia-d <yessenia.contact@gmail.com> Co-authored-by: huangzhuo1949 <167434202+huangzhuo1949@users.noreply.github.com> Co-authored-by: huangzhuo <huangzhuo1@xiaomi.com> Co-authored-by: 17hz <0x149527@gmail.com> Co-authored-by: Amy <1530140574@qq.com> Co-authored-by: Joel <iamjoel007@gmail.com> Co-authored-by: Nite Knite <nkCoding@gmail.com> Co-authored-by: Yeuoly <45712896+Yeuoly@users.noreply.github.com> Co-authored-by: Petrus Han <petrus.hanks@gmail.com> Co-authored-by: iamjoel <2120155+iamjoel@users.noreply.github.com> Co-authored-by: Kalo Chin <frog.beepers.0n@icloud.com> Co-authored-by: Ujjwal Maurya <ujjwalsbx@gmail.com> Co-authored-by: Maries <xh001x@hotmail.com>
93 lines
3.5 KiB
Python
93 lines
3.5 KiB
Python
from collections.abc import Generator
|
|
from dataclasses import dataclass, field
|
|
from typing import TypeVar, Union, cast
|
|
|
|
from core.agent.entities import AgentInvokeMessage
|
|
from core.tools.entities.tool_entities import ToolInvokeMessage
|
|
|
|
MessageType = TypeVar("MessageType", bound=Union[ToolInvokeMessage, AgentInvokeMessage])
|
|
|
|
|
|
@dataclass
|
|
class FileChunk:
|
|
"""
|
|
Buffer for accumulating file chunks during streaming.
|
|
"""
|
|
|
|
total_length: int
|
|
bytes_written: int = field(default=0, init=False)
|
|
data: bytearray = field(init=False)
|
|
|
|
def __post_init__(self) -> None:
|
|
self.data = bytearray(self.total_length)
|
|
|
|
|
|
def merge_blob_chunks(
|
|
response: Generator[MessageType, None, None],
|
|
max_file_size: int = 30 * 1024 * 1024,
|
|
max_chunk_size: int = 8192,
|
|
) -> Generator[MessageType, None, None]:
|
|
"""
|
|
Merge streaming blob chunks into complete blob messages.
|
|
|
|
This function processes a stream of plugin invoke messages, accumulating
|
|
BLOB_CHUNK messages by their ID until the final chunk is received,
|
|
then yielding a single complete BLOB message.
|
|
|
|
Args:
|
|
response: Generator yielding messages that may include blob chunks
|
|
max_file_size: Maximum allowed file size in bytes (default: 30MB)
|
|
max_chunk_size: Maximum allowed chunk size in bytes (default: 8KB)
|
|
|
|
Yields:
|
|
Messages from the response stream, with blob chunks merged into complete blobs
|
|
|
|
Raises:
|
|
ValueError: If file size exceeds max_file_size or chunk size exceeds max_chunk_size
|
|
"""
|
|
files: dict[str, FileChunk] = {}
|
|
|
|
for resp in response:
|
|
if resp.type == ToolInvokeMessage.MessageType.BLOB_CHUNK:
|
|
assert isinstance(resp.message, ToolInvokeMessage.BlobChunkMessage)
|
|
# Get blob chunk information
|
|
chunk_id = resp.message.id
|
|
total_length = resp.message.total_length
|
|
blob_data = resp.message.blob
|
|
is_end = resp.message.end
|
|
|
|
# Initialize buffer for this file if it doesn't exist
|
|
if chunk_id not in files:
|
|
files[chunk_id] = FileChunk(total_length)
|
|
|
|
# Check if file is too large (before appending)
|
|
if files[chunk_id].bytes_written + len(blob_data) > max_file_size:
|
|
# Delete the file if it's too large
|
|
del files[chunk_id]
|
|
raise ValueError(f"File is too large which reached the limit of {max_file_size / 1024 / 1024}MB")
|
|
|
|
# Check if single chunk is too large
|
|
if len(blob_data) > max_chunk_size:
|
|
raise ValueError(f"File chunk is too large which reached the limit of {max_chunk_size / 1024}KB")
|
|
|
|
# Append the blob data to the buffer
|
|
files[chunk_id].data[files[chunk_id].bytes_written : files[chunk_id].bytes_written + len(blob_data)] = (
|
|
blob_data
|
|
)
|
|
files[chunk_id].bytes_written += len(blob_data)
|
|
|
|
# If this is the final chunk, yield a complete blob message
|
|
if is_end:
|
|
# Create the appropriate message type based on the response type
|
|
message_class = type(resp)
|
|
merged_message = message_class(
|
|
type=ToolInvokeMessage.MessageType.BLOB,
|
|
message=ToolInvokeMessage.BlobMessage(blob=files[chunk_id].data[: files[chunk_id].bytes_written]),
|
|
meta=resp.meta,
|
|
)
|
|
yield cast(MessageType, merged_message)
|
|
# Clean up the buffer
|
|
del files[chunk_id]
|
|
else:
|
|
yield resp
|