Compare commits

...

8 commits

Author SHA1 Message Date
cvaz1306
7c9d4aacbe
Merge d85ab787cf into ae47101dc6 2025-12-10 17:18:53 +01:00
Timothy Jaeryang Baek
ae47101dc6 refac 2025-12-10 11:07:41 -05:00
cvaz1306
d85ab787cf
Merge branch 'dev' into feat/rate-limit-web-search 2025-11-29 17:21:39 -08:00
cvaz1306
551bc64a8d
Merge branch 'dev' into feat/rate-limit-web-search 2025-10-02 19:15:40 -07:00
Christopher Vaz
2a9f13a451 removing redundant asyncio.ensure_future() in retrieval.py 2025-09-21 19:56:19 -07:00
Christopher Vaz
76e70128f6 Merge branch 'feat/rate-limit-web-search' of https://github.com/cvaz1306/open-webui into feat/rate-limit-web-search 2025-09-14 19:31:46 -07:00
Christopher Vaz
15cb2e289d adding configurable rate limit for web search 2025-09-14 18:50:29 -07:00
Christopher Vaz
ba25c26b11 adding configurable rate limit for web search 2025-09-14 18:24:49 -07:00
3 changed files with 88 additions and 2 deletions

View file

@@ -2967,6 +2967,29 @@ WEB_SEARCH_RESULT_COUNT = PersistentConfig(
)
# Web Search Rate Limiting Config
WEB_SEARCH_RATE_LIMIT_ENABLED = PersistentConfig(
    "WEB_SEARCH_RATE_LIMIT_ENABLED",
    "rag.web.search.rate_limit.enabled",
    # Parse the env var into a real bool. The previous code stored the
    # lowered *string* (e.g. "false"), which is truthy and would defeat any
    # `if WEB_SEARCH_RATE_LIMIT_ENABLED.value:` check.
    os.getenv("WEB_SEARCH_RATE_LIMIT_ENABLED", "False").lower() == "true",
)

# The maximum number of requests that can be made to the web search engine
# per N seconds, where N = WEB_SEARCH_RATE_LIMIT_MIN_SECONDS.
WEB_SEARCH_RATE_LIMIT_MAX_REQUESTS = PersistentConfig(
    "WEB_SEARCH_RATE_LIMIT_MAX_REQUESTS",
    "rag.web.search.rate_limit.max_requests",
    int(os.getenv("WEB_SEARCH_RATE_LIMIT_MAX_REQUESTS", "1")),
)

# The length (in seconds) of the sliding window over which
# WEB_SEARCH_RATE_LIMIT_MAX_REQUESTS is enforced.
WEB_SEARCH_RATE_LIMIT_MIN_SECONDS = PersistentConfig(
    "WEB_SEARCH_RATE_LIMIT_MIN_SECONDS",
    "rag.web.search.rate_limit.min_seconds",
    # Env var name fixed to match the config key: the previous code read
    # "WEB_SEARCH_RATE_MIN_SECONDS" (missing "_LIMIT"), so the documented
    # variable was silently ignored. The misspelled name is kept as a
    # fallback for backward compatibility with existing deployments.
    int(
        os.getenv(
            "WEB_SEARCH_RATE_LIMIT_MIN_SECONDS",
            os.getenv("WEB_SEARCH_RATE_MIN_SECONDS", "1"),
        )
    ),
)
# You can provide a list of your own websites to filter after performing a web search.
# This ensures the highest level of safety and reliability of the information sources.
WEB_SEARCH_DOMAIN_FILTER_LIST = PersistentConfig(

View file

@@ -4,10 +4,12 @@ import mimetypes
import os
import shutil
import asyncio
import time
import re
import uuid
from datetime import datetime
from datetime import datetime, timedelta
from multiprocessing import Value
from pathlib import Path
from typing import Iterator, List, Optional, Sequence, Union
@@ -24,6 +26,9 @@ from fastapi import (
)
from fastapi.middleware.cors import CORSMiddleware
from fastapi.concurrency import run_in_threadpool
from functools import wraps
from collections import deque
from pydantic import BaseModel
import tiktoken
@@ -1766,7 +1771,62 @@ async def process_web(
detail=ERROR_MESSAGES.DEFAULT(e),
)
from open_webui.config import (
WEB_SEARCH_RATE_LIMIT_MAX_REQUESTS,
WEB_SEARCH_RATE_LIMIT_MIN_SECONDS,
WEB_SEARCH_RATE_LIMIT_ENABLED,
)
# Rate-limiting state for web search. Module-level so every decorated callable
# shares a single limiter. NOTE(review): this is per-process only — it does not
# coordinate across multiple workers; confirm that is acceptable for deployment.
web_search_lock = asyncio.Lock()
# Monotonic timestamps of recent calls; stale entries are pruned lazily.
web_search_timestamps = deque()


def search_rate_limit(max_calls: int, period: float):
    """
    Async-friendly decorator limiting calls to `max_calls` per `period` seconds.

    Maintains a shared sliding window of call timestamps guarded by an
    asyncio.Lock, so enforcement never blocks the event loop. The wrapper is
    always a coroutine function; it now supports both async and plain-sync
    targets (the previous version did `await func(...)` unconditionally, which
    raises TypeError when the decorator is applied to a plain `def` such as
    `search_web`).

    NOTE(review): WEB_SEARCH_RATE_LIMIT_ENABLED is imported nearby but never
    consulted here — confirm whether the limiter should apply unconditionally.
    """

    def decorator(func):
        # Decide the call style once, at decoration time.
        target_is_coroutine = asyncio.iscoroutinefunction(func)

        @wraps(func)
        async def wrapper(*args, **kwargs):
            async with web_search_lock:
                # time.monotonic() is immune to wall-clock adjustments and
                # replaces the deprecated asyncio.get_event_loop().time().
                now = time.monotonic()
                # Evict timestamps that have aged out of the window.
                while web_search_timestamps and now - web_search_timestamps[0] > period:
                    web_search_timestamps.popleft()
                if len(web_search_timestamps) >= max_calls:
                    # Window is full: sleep until the oldest entry expires.
                    # The lock is held while sleeping, so concurrent callers
                    # queue up FIFO behind this one.
                    await asyncio.sleep(period - (now - web_search_timestamps[0]))
                    now = time.monotonic()
                    while (
                        web_search_timestamps
                        and now - web_search_timestamps[0] > period
                    ):
                        web_search_timestamps.popleft()
                # Record this call's start time.
                web_search_timestamps.append(now)
            # Invoke the target outside the lock so only admission is
            # serialized, not the search itself.
            if target_is_coroutine:
                return await func(*args, **kwargs)
            # Sync target: runs inline on the event-loop thread. Acceptable for
            # quick calls; offload to a threadpool if it ever blocks for long.
            return func(*args, **kwargs)

        return wrapper

    return decorator
@search_rate_limit(
int(WEB_SEARCH_RATE_LIMIT_MAX_REQUESTS.value),
int(WEB_SEARCH_RATE_LIMIT_MIN_SECONDS.value),
)
def search_web(
request: Request, engine: str, query: str, user=None
) -> list[SearchResult]:
@@ -1792,6 +1852,8 @@ def search_web(
query (str): The query to search for
"""
logging.info(f"search_web: {engine} query: {query}")
# TODO: add playwright to search the web
if engine == "ollama_cloud":
return search_ollama_cloud(
@@ -2087,6 +2149,7 @@ async def process_web_search(
for result in search_results:
if result:
result = await result
for item in result:
if item and item.link:
result_items.append(item)

View file

@@ -339,7 +339,7 @@
</tr>
</thead>
<tbody class="">
{#each users as user, userIdx}
{#each users as user, userIdx (user.id)}
<tr class="bg-white dark:bg-gray-900 dark:border-gray-850 text-xs">
<td class="px-3 py-1 min-w-[7rem] w-28">
<button