enh: CHAT_RESPONSE_STREAM_DELTA_CHUNK_SIZE

This commit is contained in:
Timothy Jaeryang Baek 2025-08-09 23:49:56 +04:00
parent a068ba88de
commit 4e9c75be50
2 changed files with 21 additions and 1 deletions

View file

@ -487,6 +487,25 @@ else:
MODELS_CACHE_TTL = 1 MODELS_CACHE_TTL = 1
####################################
# CHAT
####################################
# Integer chunk size for streamed chat response deltas, read from the
# environment. An unset, empty, or non-integer value falls back to 1, and
# values below 1 are raised to 1 so the setting is always a positive int.
try:
    CHAT_RESPONSE_STREAM_DELTA_CHUNK_SIZE = max(
        1, int(os.environ.get("CHAT_RESPONSE_STREAM_DELTA_CHUNK_SIZE", "1"))
    )
except ValueError:
    # int() rejects "" and any other non-integer text with ValueError.
    CHAT_RESPONSE_STREAM_DELTA_CHUNK_SIZE = 1
####################################
# WEBSOCKET SUPPORT
####################################

View file

@ -95,6 +95,7 @@ from open_webui.config import (
from open_webui.env import ( from open_webui.env import (
SRC_LOG_LEVELS, SRC_LOG_LEVELS,
GLOBAL_LOG_LEVEL, GLOBAL_LOG_LEVEL,
CHAT_RESPONSE_STREAM_DELTA_CHUNK_SIZE,
BYPASS_MODEL_ACCESS_CONTROL, BYPASS_MODEL_ACCESS_CONTROL,
ENABLE_REALTIME_CHAT_SAVE, ENABLE_REALTIME_CHAT_SAVE,
) )
@ -1819,7 +1820,7 @@ async def process_chat_response(
delta_count = 0 delta_count = 0
delta_chunk_size = max( delta_chunk_size = max(
1, CHAT_RESPONSE_STREAM_DELTA_CHUNK_SIZE,
int( int(
metadata.get("params", {}).get("stream_delta_chunk_size") metadata.get("params", {}).get("stream_delta_chunk_size")
or 1 or 1