diff --git a/backend/open_webui/utils/middleware.py b/backend/open_webui/utils/middleware.py index c2378db885..fa5634edbd 100644 --- a/backend/open_webui/utils/middleware.py +++ b/backend/open_webui/utils/middleware.py @@ -1964,6 +1964,10 @@ async def process_chat_response( } ) usage = data.get("usage", {}) + usage.update( + data.get("timing", {}) + ) # llama.cpp + if usage: await event_emitter( {