12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749 |
- import asyncio
- import inspect
- import json
- import logging
- import mimetypes
- import os
- import shutil
- import sys
- import time
- import random
- from contextlib import asynccontextmanager
- from urllib.parse import urlencode, parse_qs, urlparse
- from pydantic import BaseModel
- from sqlalchemy import text
- from typing import Optional
- from aiocache import cached
- import aiohttp
- import requests
- from fastapi import (
- Depends,
- FastAPI,
- File,
- Form,
- HTTPException,
- Request,
- UploadFile,
- status,
- )
- from fastapi.middleware.cors import CORSMiddleware
- from fastapi.responses import JSONResponse, RedirectResponse
- from fastapi.staticfiles import StaticFiles
- from starlette.exceptions import HTTPException as StarletteHTTPException
- from starlette.middleware.base import BaseHTTPMiddleware
- from starlette.middleware.sessions import SessionMiddleware
- from starlette.responses import Response, StreamingResponse
- from open_webui.socket.main import (
- app as socket_app,
- periodic_usage_pool_cleanup,
- get_event_call,
- get_event_emitter,
- )
- from open_webui.routers import (
- audio,
- images,
- ollama,
- openai,
- retrieval,
- pipelines,
- tasks,
- auths,
- chats,
- folders,
- configs,
- groups,
- files,
- functions,
- memories,
- models,
- knowledge,
- prompts,
- evaluations,
- tools,
- users,
- utils,
- )
- from open_webui.routers.retrieval import (
- get_embedding_function,
- get_ef,
- get_rf,
- )
- from open_webui.routers.pipelines import (
- process_pipeline_inlet_filter,
- )
- from open_webui.retrieval.utils import get_sources_from_files
- from open_webui.internal.db import Session
- from open_webui.models.functions import Functions
- from open_webui.models.models import Models
- from open_webui.models.users import UserModel, Users
- from open_webui.constants import TASKS
- from open_webui.config import (
- # Ollama
- ENABLE_OLLAMA_API,
- OLLAMA_BASE_URLS,
- OLLAMA_API_CONFIGS,
- # OpenAI
- ENABLE_OPENAI_API,
- OPENAI_API_BASE_URLS,
- OPENAI_API_KEYS,
- OPENAI_API_CONFIGS,
- # Image
- AUTOMATIC1111_API_AUTH,
- AUTOMATIC1111_BASE_URL,
- AUTOMATIC1111_CFG_SCALE,
- AUTOMATIC1111_SAMPLER,
- AUTOMATIC1111_SCHEDULER,
- COMFYUI_BASE_URL,
- COMFYUI_WORKFLOW,
- COMFYUI_WORKFLOW_NODES,
- ENABLE_IMAGE_GENERATION,
- IMAGE_GENERATION_ENGINE,
- IMAGE_GENERATION_MODEL,
- IMAGE_SIZE,
- IMAGE_STEPS,
- IMAGES_OPENAI_API_BASE_URL,
- IMAGES_OPENAI_API_KEY,
- # Audio
- AUDIO_STT_ENGINE,
- AUDIO_STT_MODEL,
- AUDIO_STT_OPENAI_API_BASE_URL,
- AUDIO_STT_OPENAI_API_KEY,
- AUDIO_TTS_API_KEY,
- AUDIO_TTS_ENGINE,
- AUDIO_TTS_MODEL,
- AUDIO_TTS_OPENAI_API_BASE_URL,
- AUDIO_TTS_OPENAI_API_KEY,
- AUDIO_TTS_SPLIT_ON,
- AUDIO_TTS_VOICE,
- AUDIO_TTS_AZURE_SPEECH_REGION,
- AUDIO_TTS_AZURE_SPEECH_OUTPUT_FORMAT,
- WHISPER_MODEL,
- WHISPER_MODEL_AUTO_UPDATE,
- WHISPER_MODEL_DIR,
- # Retrieval
- RAG_TEMPLATE,
- DEFAULT_RAG_TEMPLATE,
- RAG_EMBEDDING_MODEL,
- RAG_EMBEDDING_MODEL_AUTO_UPDATE,
- RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE,
- RAG_RERANKING_MODEL,
- RAG_RERANKING_MODEL_AUTO_UPDATE,
- RAG_RERANKING_MODEL_TRUST_REMOTE_CODE,
- RAG_EMBEDDING_ENGINE,
- RAG_EMBEDDING_BATCH_SIZE,
- RAG_RELEVANCE_THRESHOLD,
- RAG_FILE_MAX_COUNT,
- RAG_FILE_MAX_SIZE,
- RAG_OPENAI_API_BASE_URL,
- RAG_OPENAI_API_KEY,
- RAG_OLLAMA_BASE_URL,
- RAG_OLLAMA_API_KEY,
- CHUNK_OVERLAP,
- CHUNK_SIZE,
- CONTENT_EXTRACTION_ENGINE,
- TIKA_SERVER_URL,
- RAG_TOP_K,
- RAG_TEXT_SPLITTER,
- TIKTOKEN_ENCODING_NAME,
- PDF_EXTRACT_IMAGES,
- YOUTUBE_LOADER_LANGUAGE,
- YOUTUBE_LOADER_PROXY_URL,
- # Retrieval (Web Search)
- RAG_WEB_SEARCH_ENGINE,
- RAG_WEB_SEARCH_RESULT_COUNT,
- RAG_WEB_SEARCH_CONCURRENT_REQUESTS,
- RAG_WEB_SEARCH_DOMAIN_FILTER_LIST,
- JINA_API_KEY,
- SEARCHAPI_API_KEY,
- SEARCHAPI_ENGINE,
- SEARXNG_QUERY_URL,
- SERPER_API_KEY,
- SERPLY_API_KEY,
- SERPSTACK_API_KEY,
- SERPSTACK_HTTPS,
- TAVILY_API_KEY,
- BING_SEARCH_V7_ENDPOINT,
- BING_SEARCH_V7_SUBSCRIPTION_KEY,
- BRAVE_SEARCH_API_KEY,
- KAGI_SEARCH_API_KEY,
- MOJEEK_SEARCH_API_KEY,
- GOOGLE_PSE_API_KEY,
- GOOGLE_PSE_ENGINE_ID,
- ENABLE_RAG_HYBRID_SEARCH,
- ENABLE_RAG_LOCAL_WEB_FETCH,
- ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION,
- ENABLE_RAG_WEB_SEARCH,
- UPLOAD_DIR,
- # WebUI
- WEBUI_AUTH,
- WEBUI_NAME,
- WEBUI_BANNERS,
- WEBHOOK_URL,
- ADMIN_EMAIL,
- SHOW_ADMIN_DETAILS,
- JWT_EXPIRES_IN,
- ENABLE_SIGNUP,
- ENABLE_LOGIN_FORM,
- ENABLE_API_KEY,
- ENABLE_COMMUNITY_SHARING,
- ENABLE_MESSAGE_RATING,
- ENABLE_EVALUATION_ARENA_MODELS,
- USER_PERMISSIONS,
- DEFAULT_USER_ROLE,
- DEFAULT_PROMPT_SUGGESTIONS,
- DEFAULT_MODELS,
- DEFAULT_ARENA_MODEL,
- MODEL_ORDER_LIST,
- EVALUATION_ARENA_MODELS,
- # WebUI (OAuth)
- ENABLE_OAUTH_ROLE_MANAGEMENT,
- OAUTH_ROLES_CLAIM,
- OAUTH_EMAIL_CLAIM,
- OAUTH_PICTURE_CLAIM,
- OAUTH_USERNAME_CLAIM,
- OAUTH_ALLOWED_ROLES,
- OAUTH_ADMIN_ROLES,
- # WebUI (LDAP)
- ENABLE_LDAP,
- LDAP_SERVER_LABEL,
- LDAP_SERVER_HOST,
- LDAP_SERVER_PORT,
- LDAP_ATTRIBUTE_FOR_USERNAME,
- LDAP_SEARCH_FILTERS,
- LDAP_SEARCH_BASE,
- LDAP_APP_DN,
- LDAP_APP_PASSWORD,
- LDAP_USE_TLS,
- LDAP_CA_CERT_FILE,
- LDAP_CIPHERS,
- # Misc
- ENV,
- CACHE_DIR,
- STATIC_DIR,
- FRONTEND_BUILD_DIR,
- CORS_ALLOW_ORIGIN,
- DEFAULT_LOCALE,
- OAUTH_PROVIDERS,
- # Admin
- ENABLE_ADMIN_CHAT_ACCESS,
- ENABLE_ADMIN_EXPORT,
- # Tasks
- TASK_MODEL,
- TASK_MODEL_EXTERNAL,
- ENABLE_TAGS_GENERATION,
- ENABLE_SEARCH_QUERY_GENERATION,
- ENABLE_RETRIEVAL_QUERY_GENERATION,
- ENABLE_AUTOCOMPLETE_GENERATION,
- TITLE_GENERATION_PROMPT_TEMPLATE,
- TAGS_GENERATION_PROMPT_TEMPLATE,
- TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE,
- QUERY_GENERATION_PROMPT_TEMPLATE,
- AUTOCOMPLETE_GENERATION_PROMPT_TEMPLATE,
- AUTOCOMPLETE_GENERATION_INPUT_MAX_LENGTH,
- AppConfig,
- reset_config,
- )
- from open_webui.env import (
- CHANGELOG,
- GLOBAL_LOG_LEVEL,
- SAFE_MODE,
- SRC_LOG_LEVELS,
- VERSION,
- WEBUI_URL,
- WEBUI_BUILD_HASH,
- WEBUI_SECRET_KEY,
- WEBUI_SESSION_COOKIE_SAME_SITE,
- WEBUI_SESSION_COOKIE_SECURE,
- WEBUI_AUTH_TRUSTED_EMAIL_HEADER,
- WEBUI_AUTH_TRUSTED_NAME_HEADER,
- BYPASS_MODEL_ACCESS_CONTROL,
- RESET_CONFIG_ON_START,
- OFFLINE_MODE,
- )
- from open_webui.utils.models import get_all_models, get_all_base_models
- from open_webui.utils.chat import (
- generate_chat_completion as chat_completion_handler,
- chat_completed as chat_completed_handler,
- chat_action as chat_action_handler,
- )
- from open_webui.utils.plugin import load_function_module_by_id
- from open_webui.utils.misc import (
- add_or_update_system_message,
- get_last_user_message,
- prepend_to_first_user_message_content,
- openai_chat_chunk_message_template,
- openai_chat_completion_message_template,
- )
- from open_webui.utils.payload import convert_payload_openai_to_ollama
- from open_webui.utils.response import (
- convert_response_ollama_to_openai,
- convert_streaming_response_ollama_to_openai,
- )
- from open_webui.utils.task import (
- get_task_model_id,
- rag_template,
- tools_function_calling_generation_template,
- )
- from open_webui.utils.tools import get_tools
- from open_webui.utils.access_control import has_access
- from open_webui.utils.auth import (
- decode_token,
- get_admin_user,
- get_current_user,
- get_http_authorization_cred,
- get_verified_user,
- )
- from open_webui.utils.oauth import oauth_manager
- from open_webui.utils.security_headers import SecurityHeadersMiddleware
# In safe mode, announce it and call Functions.deactivate_all_functions()
# before anything else in this module runs.
if SAFE_MODE:
    print("SAFE MODE ENABLED")
    Functions.deactivate_all_functions()

# Root logging goes to stdout at the global level; this module's logger then
# gets the level configured under the "MAIN" key.
logging.basicConfig(level=GLOBAL_LOG_LEVEL, stream=sys.stdout)
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["MAIN"])
class SPAStaticFiles(StaticFiles):
    """Static file handler that answers unknown paths with ``index.html``."""

    async def get_response(self, path: str, scope):
        """Return the file at ``path``; on a 404, return ``index.html`` instead.

        Any HTTP error other than 404 is re-raised unchanged.
        """
        try:
            response = await super().get_response(path, scope)
        except (HTTPException, StarletteHTTPException) as ex:
            if ex.status_code != 404:
                raise ex
            # Unknown path: hand back the application shell.
            response = await super().get_response("index.html", scope)
        return response
# Startup banner: ASCII-art logo, version, optional commit hash, project URL.
# The column spacing inside the logo is significant; keep the rows aligned.
# NOTE(review): spacing was reconstructed from a whitespace-collapsed copy of
# this file — confirm against the repository version.
print(
    rf"""
  ___                    __        __   _     _   _ ___
 / _ \ _ __   ___ _ __   \ \      / /__| |__ | | | |_ _|
| | | | '_ \ / _ \ '_ \   \ \ /\ / / _ \ '_ \| | | || |
| |_| | |_) |  __/ | | |   \ V  V /  __/ |_) | |_| || |
 \___/| .__/ \___|_| |_|    \_/\_/ \___|_.__/ \___/|___|
      |_|
v{VERSION} - building the best open-source AI user interface.
{f"Commit: {WEBUI_BUILD_HASH}" if WEBUI_BUILD_HASH != "dev-build" else ""}
https://github.com/open-webui/open-webui
"""
)
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Application lifespan: optional config reset, then the usage-pool cleanup task.

    On startup, calls ``reset_config()`` when ``RESET_CONFIG_ON_START`` is set
    and schedules ``periodic_usage_pool_cleanup()`` as a background task. On
    shutdown the task is cancelled.
    """
    if RESET_CONFIG_ON_START:
        reset_config()

    # Keep a strong reference to the task: the event loop itself only holds a
    # weak one, so an unreferenced task may be garbage-collected mid-run.
    cleanup_task = asyncio.create_task(periodic_usage_pool_cleanup())
    try:
        yield
    finally:
        # No-op if the task has already finished.
        cleanup_task.cancel()
# The interactive docs and the OpenAPI schema are only exposed when ENV is "dev".
_dev_mode = ENV == "dev"

app = FastAPI(
    docs_url="/docs" if _dev_mode else None,
    openapi_url="/openapi.json" if _dev_mode else None,
    redoc_url=None,
    lifespan=lifespan,
)

# Configuration container that the sections below populate.
app.state.config = AppConfig()
########################################
#
# OLLAMA
#
########################################

# Short aliases for the objects being populated.
_state = app.state
_cfg = _state.config

_cfg.ENABLE_OLLAMA_API = ENABLE_OLLAMA_API
_cfg.OLLAMA_BASE_URLS = OLLAMA_BASE_URLS
_cfg.OLLAMA_API_CONFIGS = OLLAMA_API_CONFIGS

_state.OLLAMA_MODELS = {}

########################################
#
# OPENAI
#
########################################

_cfg.ENABLE_OPENAI_API = ENABLE_OPENAI_API
_cfg.OPENAI_API_BASE_URLS = OPENAI_API_BASE_URLS
_cfg.OPENAI_API_KEYS = OPENAI_API_KEYS
_cfg.OPENAI_API_CONFIGS = OPENAI_API_CONFIGS

_state.OPENAI_MODELS = {}
########################################
#
# WEBUI
#
########################################

# Short aliases for the objects being populated.
_state = app.state
_cfg = _state.config

# Sign-up, login and general UI settings
_cfg.ENABLE_SIGNUP = ENABLE_SIGNUP
_cfg.ENABLE_LOGIN_FORM = ENABLE_LOGIN_FORM
_cfg.ENABLE_API_KEY = ENABLE_API_KEY
_cfg.JWT_EXPIRES_IN = JWT_EXPIRES_IN
_cfg.SHOW_ADMIN_DETAILS = SHOW_ADMIN_DETAILS
_cfg.ADMIN_EMAIL = ADMIN_EMAIL
_cfg.DEFAULT_MODELS = DEFAULT_MODELS
_cfg.DEFAULT_PROMPT_SUGGESTIONS = DEFAULT_PROMPT_SUGGESTIONS
_cfg.DEFAULT_USER_ROLE = DEFAULT_USER_ROLE
_cfg.USER_PERMISSIONS = USER_PERMISSIONS
_cfg.WEBHOOK_URL = WEBHOOK_URL
_cfg.BANNERS = WEBUI_BANNERS
_cfg.MODEL_ORDER_LIST = MODEL_ORDER_LIST
_cfg.ENABLE_COMMUNITY_SHARING = ENABLE_COMMUNITY_SHARING
_cfg.ENABLE_MESSAGE_RATING = ENABLE_MESSAGE_RATING
_cfg.ENABLE_EVALUATION_ARENA_MODELS = ENABLE_EVALUATION_ARENA_MODELS
_cfg.EVALUATION_ARENA_MODELS = EVALUATION_ARENA_MODELS

# OAuth claims and role mapping
_cfg.OAUTH_USERNAME_CLAIM = OAUTH_USERNAME_CLAIM
_cfg.OAUTH_PICTURE_CLAIM = OAUTH_PICTURE_CLAIM
_cfg.OAUTH_EMAIL_CLAIM = OAUTH_EMAIL_CLAIM
_cfg.ENABLE_OAUTH_ROLE_MANAGEMENT = ENABLE_OAUTH_ROLE_MANAGEMENT
_cfg.OAUTH_ROLES_CLAIM = OAUTH_ROLES_CLAIM
_cfg.OAUTH_ALLOWED_ROLES = OAUTH_ALLOWED_ROLES
_cfg.OAUTH_ADMIN_ROLES = OAUTH_ADMIN_ROLES

# LDAP
_cfg.ENABLE_LDAP = ENABLE_LDAP
_cfg.LDAP_SERVER_LABEL = LDAP_SERVER_LABEL
_cfg.LDAP_SERVER_HOST = LDAP_SERVER_HOST
_cfg.LDAP_SERVER_PORT = LDAP_SERVER_PORT
_cfg.LDAP_ATTRIBUTE_FOR_USERNAME = LDAP_ATTRIBUTE_FOR_USERNAME
_cfg.LDAP_APP_DN = LDAP_APP_DN
_cfg.LDAP_APP_PASSWORD = LDAP_APP_PASSWORD
_cfg.LDAP_SEARCH_BASE = LDAP_SEARCH_BASE
_cfg.LDAP_SEARCH_FILTERS = LDAP_SEARCH_FILTERS
_cfg.LDAP_USE_TLS = LDAP_USE_TLS
_cfg.LDAP_CA_CERT_FILE = LDAP_CA_CERT_FILE
_cfg.LDAP_CIPHERS = LDAP_CIPHERS

# Values kept directly on app.state rather than on the config object
_state.AUTH_TRUSTED_EMAIL_HEADER = WEBUI_AUTH_TRUSTED_EMAIL_HEADER
_state.AUTH_TRUSTED_NAME_HEADER = WEBUI_AUTH_TRUSTED_NAME_HEADER

_state.TOOLS = {}
_state.FUNCTIONS = {}
########################################
#
# RETRIEVAL
#
########################################

app.state.config.TOP_K = RAG_TOP_K
app.state.config.RELEVANCE_THRESHOLD = RAG_RELEVANCE_THRESHOLD
app.state.config.FILE_MAX_SIZE = RAG_FILE_MAX_SIZE
app.state.config.FILE_MAX_COUNT = RAG_FILE_MAX_COUNT

app.state.config.ENABLE_RAG_HYBRID_SEARCH = ENABLE_RAG_HYBRID_SEARCH
app.state.config.ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION = (
    ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION
)

app.state.config.CONTENT_EXTRACTION_ENGINE = CONTENT_EXTRACTION_ENGINE
app.state.config.TIKA_SERVER_URL = TIKA_SERVER_URL

app.state.config.TEXT_SPLITTER = RAG_TEXT_SPLITTER
app.state.config.TIKTOKEN_ENCODING_NAME = TIKTOKEN_ENCODING_NAME

app.state.config.CHUNK_SIZE = CHUNK_SIZE
app.state.config.CHUNK_OVERLAP = CHUNK_OVERLAP

app.state.config.RAG_EMBEDDING_ENGINE = RAG_EMBEDDING_ENGINE
app.state.config.RAG_EMBEDDING_MODEL = RAG_EMBEDDING_MODEL
app.state.config.RAG_EMBEDDING_BATCH_SIZE = RAG_EMBEDDING_BATCH_SIZE
app.state.config.RAG_RERANKING_MODEL = RAG_RERANKING_MODEL
app.state.config.RAG_TEMPLATE = RAG_TEMPLATE

app.state.config.RAG_OPENAI_API_BASE_URL = RAG_OPENAI_API_BASE_URL
app.state.config.RAG_OPENAI_API_KEY = RAG_OPENAI_API_KEY

app.state.config.RAG_OLLAMA_BASE_URL = RAG_OLLAMA_BASE_URL
app.state.config.RAG_OLLAMA_API_KEY = RAG_OLLAMA_API_KEY

app.state.config.PDF_EXTRACT_IMAGES = PDF_EXTRACT_IMAGES

app.state.config.YOUTUBE_LOADER_LANGUAGE = YOUTUBE_LOADER_LANGUAGE
app.state.config.YOUTUBE_LOADER_PROXY_URL = YOUTUBE_LOADER_PROXY_URL

app.state.config.ENABLE_RAG_WEB_SEARCH = ENABLE_RAG_WEB_SEARCH
app.state.config.RAG_WEB_SEARCH_ENGINE = RAG_WEB_SEARCH_ENGINE
app.state.config.RAG_WEB_SEARCH_DOMAIN_FILTER_LIST = RAG_WEB_SEARCH_DOMAIN_FILTER_LIST

app.state.config.SEARXNG_QUERY_URL = SEARXNG_QUERY_URL
app.state.config.GOOGLE_PSE_API_KEY = GOOGLE_PSE_API_KEY
app.state.config.GOOGLE_PSE_ENGINE_ID = GOOGLE_PSE_ENGINE_ID
app.state.config.BRAVE_SEARCH_API_KEY = BRAVE_SEARCH_API_KEY
app.state.config.KAGI_SEARCH_API_KEY = KAGI_SEARCH_API_KEY
app.state.config.MOJEEK_SEARCH_API_KEY = MOJEEK_SEARCH_API_KEY
app.state.config.SERPSTACK_API_KEY = SERPSTACK_API_KEY
app.state.config.SERPSTACK_HTTPS = SERPSTACK_HTTPS
app.state.config.SERPER_API_KEY = SERPER_API_KEY
app.state.config.SERPLY_API_KEY = SERPLY_API_KEY
app.state.config.TAVILY_API_KEY = TAVILY_API_KEY
app.state.config.SEARCHAPI_API_KEY = SEARCHAPI_API_KEY
app.state.config.SEARCHAPI_ENGINE = SEARCHAPI_ENGINE
app.state.config.JINA_API_KEY = JINA_API_KEY
app.state.config.BING_SEARCH_V7_ENDPOINT = BING_SEARCH_V7_ENDPOINT
app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY = BING_SEARCH_V7_SUBSCRIPTION_KEY

app.state.config.RAG_WEB_SEARCH_RESULT_COUNT = RAG_WEB_SEARCH_RESULT_COUNT
app.state.config.RAG_WEB_SEARCH_CONCURRENT_REQUESTS = RAG_WEB_SEARCH_CONCURRENT_REQUESTS

app.state.EMBEDDING_FUNCTION = None
app.state.ef = None
app.state.rf = None

app.state.YOUTUBE_LOADER_TRANSLATION = None

# Load the embedding and reranking models first. On failure the error is
# logged and both stay at whatever they were set to above (best effort).
try:
    app.state.ef = get_ef(
        app.state.config.RAG_EMBEDDING_ENGINE,
        app.state.config.RAG_EMBEDDING_MODEL,
        RAG_EMBEDDING_MODEL_AUTO_UPDATE,
    )

    app.state.rf = get_rf(
        app.state.config.RAG_RERANKING_MODEL,
        RAG_RERANKING_MODEL_AUTO_UPDATE,
    )
except Exception as e:
    log.error(f"Error updating models: {e}")

# Build the embedding function only after app.state.ef has been loaded, so it
# is handed the loaded model rather than the None placeholder assigned above.
# The base URL and API key are the OpenAI ones when the engine is "openai",
# otherwise the Ollama ones.
app.state.EMBEDDING_FUNCTION = get_embedding_function(
    app.state.config.RAG_EMBEDDING_ENGINE,
    app.state.config.RAG_EMBEDDING_MODEL,
    app.state.ef,
    (
        app.state.config.RAG_OPENAI_API_BASE_URL
        if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
        else app.state.config.RAG_OLLAMA_BASE_URL
    ),
    (
        app.state.config.RAG_OPENAI_API_KEY
        if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
        else app.state.config.RAG_OLLAMA_API_KEY
    ),
    app.state.config.RAG_EMBEDDING_BATCH_SIZE,
)
########################################
#
# IMAGES
#
########################################

# Short alias for the config object being populated.
_cfg = app.state.config

_cfg.IMAGE_GENERATION_ENGINE = IMAGE_GENERATION_ENGINE
_cfg.ENABLE_IMAGE_GENERATION = ENABLE_IMAGE_GENERATION

_cfg.IMAGES_OPENAI_API_BASE_URL = IMAGES_OPENAI_API_BASE_URL
_cfg.IMAGES_OPENAI_API_KEY = IMAGES_OPENAI_API_KEY

_cfg.IMAGE_GENERATION_MODEL = IMAGE_GENERATION_MODEL

_cfg.AUTOMATIC1111_BASE_URL = AUTOMATIC1111_BASE_URL
_cfg.AUTOMATIC1111_API_AUTH = AUTOMATIC1111_API_AUTH
_cfg.AUTOMATIC1111_CFG_SCALE = AUTOMATIC1111_CFG_SCALE
_cfg.AUTOMATIC1111_SAMPLER = AUTOMATIC1111_SAMPLER
_cfg.AUTOMATIC1111_SCHEDULER = AUTOMATIC1111_SCHEDULER

_cfg.COMFYUI_BASE_URL = COMFYUI_BASE_URL
_cfg.COMFYUI_WORKFLOW = COMFYUI_WORKFLOW
_cfg.COMFYUI_WORKFLOW_NODES = COMFYUI_WORKFLOW_NODES

_cfg.IMAGE_SIZE = IMAGE_SIZE
_cfg.IMAGE_STEPS = IMAGE_STEPS
########################################
#
# AUDIO
#
########################################

# Short aliases for the objects being populated.
_state = app.state
_cfg = _state.config

# Speech-to-text
_cfg.STT_OPENAI_API_BASE_URL = AUDIO_STT_OPENAI_API_BASE_URL
_cfg.STT_OPENAI_API_KEY = AUDIO_STT_OPENAI_API_KEY
_cfg.STT_ENGINE = AUDIO_STT_ENGINE
_cfg.STT_MODEL = AUDIO_STT_MODEL

_cfg.WHISPER_MODEL = WHISPER_MODEL

# Text-to-speech
_cfg.TTS_OPENAI_API_BASE_URL = AUDIO_TTS_OPENAI_API_BASE_URL
_cfg.TTS_OPENAI_API_KEY = AUDIO_TTS_OPENAI_API_KEY
_cfg.TTS_ENGINE = AUDIO_TTS_ENGINE
_cfg.TTS_MODEL = AUDIO_TTS_MODEL
_cfg.TTS_VOICE = AUDIO_TTS_VOICE
_cfg.TTS_API_KEY = AUDIO_TTS_API_KEY
_cfg.TTS_SPLIT_ON = AUDIO_TTS_SPLIT_ON

_cfg.TTS_AZURE_SPEECH_REGION = AUDIO_TTS_AZURE_SPEECH_REGION
_cfg.TTS_AZURE_SPEECH_OUTPUT_FORMAT = AUDIO_TTS_AZURE_SPEECH_OUTPUT_FORMAT

# Placeholders on app.state, all initialised to None here.
_state.faster_whisper_model = None
_state.speech_synthesiser = None
_state.speech_speaker_embeddings_dataset = None
########################################
#
# TASKS
#
########################################

# Short alias for the config object being populated.
_cfg = app.state.config

_cfg.TASK_MODEL = TASK_MODEL
_cfg.TASK_MODEL_EXTERNAL = TASK_MODEL_EXTERNAL

# Feature switches
_cfg.ENABLE_SEARCH_QUERY_GENERATION = ENABLE_SEARCH_QUERY_GENERATION
_cfg.ENABLE_RETRIEVAL_QUERY_GENERATION = ENABLE_RETRIEVAL_QUERY_GENERATION
_cfg.ENABLE_AUTOCOMPLETE_GENERATION = ENABLE_AUTOCOMPLETE_GENERATION
_cfg.ENABLE_TAGS_GENERATION = ENABLE_TAGS_GENERATION

# Prompt templates
_cfg.TITLE_GENERATION_PROMPT_TEMPLATE = TITLE_GENERATION_PROMPT_TEMPLATE
_cfg.TAGS_GENERATION_PROMPT_TEMPLATE = TAGS_GENERATION_PROMPT_TEMPLATE
_cfg.TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE = TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE
_cfg.QUERY_GENERATION_PROMPT_TEMPLATE = QUERY_GENERATION_PROMPT_TEMPLATE
_cfg.AUTOCOMPLETE_GENERATION_PROMPT_TEMPLATE = AUTOCOMPLETE_GENERATION_PROMPT_TEMPLATE
_cfg.AUTOCOMPLETE_GENERATION_INPUT_MAX_LENGTH = AUTOCOMPLETE_GENERATION_INPUT_MAX_LENGTH

########################################
#
# WEBUI
#
########################################

app.state.MODELS = {}
- ##################################
- #
- # ChatCompletion Middleware
- #
- ##################################
async def chat_completion_filter_functions_handler(body, model, extra_params):
    """Pass ``body`` through the ``inlet`` hook of every applicable filter function.

    Candidate filters are the global filter functions plus the ids listed under
    ``model["info"]["meta"]["filterIds"]``. Only ids that are also returned by
    ``Functions.get_functions_by_type("filter", active_only=True)`` are kept,
    and they run in ascending order of their ``priority`` valve (default 0).

    Args:
        body: Request payload; replaced by the return value of each inlet.
        model: Model dict for the request.
        extra_params: Extra keyword values (for example ``__user__``); only the
            keys that appear in an inlet's signature are passed to it.

    Returns:
        ``(body, {})``. ``body["metadata"]["files"]`` is removed when the last
        filter module exposing ``file_handler`` had a truthy value for it.

    Raises:
        Exception: any error raised while preparing or calling an inlet is
            logged and re-raised.
    """
    skip_files = None

    def get_filter_function_ids(model):
        def get_priority(function_id):
            function = Functions.get_function_by_id(function_id)
            if function is not None and hasattr(function, "valves"):
                # TODO: Fix FunctionModel
                return (function.valves if function.valves else {}).get("priority", 0)
            return 0

        filter_ids = [
            function.id for function in Functions.get_global_filter_functions()
        ]
        if "info" in model and "meta" in model["info"]:
            # "filterIds" may be present but null; treat that as no extra filters.
            filter_ids.extend(model["info"]["meta"].get("filterIds") or [])

        # De-duplicate while keeping first-seen order. A set would make the
        # relative order of equal-priority filters depend on hash order.
        filter_ids = list(dict.fromkeys(filter_ids))

        enabled_filter_ids = {
            function.id
            for function in Functions.get_functions_by_type("filter", active_only=True)
        }
        filter_ids = [
            filter_id for filter_id in filter_ids if filter_id in enabled_filter_ids
        ]

        # list.sort is stable, so ties keep the order established above.
        filter_ids.sort(key=get_priority)
        return filter_ids

    for filter_id in get_filter_function_ids(model):
        filter_function = Functions.get_function_by_id(filter_id)
        if not filter_function:
            continue

        # Reuse the cached module when there is one; otherwise load and cache it.
        if filter_id in app.state.FUNCTIONS:
            function_module = app.state.FUNCTIONS[filter_id]
        else:
            function_module, _, _ = load_function_module_by_id(filter_id)
            app.state.FUNCTIONS[filter_id] = function_module

        # Check if the function has a file_handler variable
        if hasattr(function_module, "file_handler"):
            skip_files = function_module.file_handler

        # Refresh the module's valves from the stored values on every call.
        if hasattr(function_module, "valves") and hasattr(function_module, "Valves"):
            valves = Functions.get_function_valves_by_id(filter_id)
            function_module.valves = function_module.Valves(
                **(valves if valves else {})
            )

        if not hasattr(function_module, "inlet"):
            continue

        try:
            inlet = function_module.inlet

            # Pass only the extras that the inlet actually declares.
            sig = inspect.signature(inlet)
            params = {"body": body} | {
                k: v
                for k, v in {
                    **extra_params,
                    "__model__": model,
                    "__id__": filter_id,
                }.items()
                if k in sig.parameters
            }

            if "__user__" in params and hasattr(function_module, "UserValves"):
                try:
                    params["__user__"]["valves"] = function_module.UserValves(
                        **Functions.get_user_valves_by_id_and_user_id(
                            filter_id, params["__user__"]["id"]
                        )
                    )
                except Exception as e:
                    # Best effort: the inlet still runs without user valves.
                    log.exception(e)

            if inspect.iscoroutinefunction(inlet):
                body = await inlet(**params)
            else:
                body = inlet(**params)

        except Exception as e:
            log.exception(f"Error: {e}")
            raise

    if skip_files and "files" in body.get("metadata", {}):
        del body["metadata"]["files"]

    return body, {}
async def chat_completion_tools_handler(
    request: Request, body: dict, user: UserModel, models, extra_params: dict
) -> tuple[dict, dict]:
    """Ask the task model which tool to call, call it, and collect its output.

    When ``body["metadata"]["tool_ids"]`` is set, a function-calling prompt
    listing the tool specs is sent to the task model. If the reply contains a
    JSON object naming a known tool, that tool is awaited and a string result
    is appended to the returned sources.

    Args:
        request: Incoming request; used for app config and passed to helpers.
        body: Chat-completion payload (reads ``model``, ``messages``, ``metadata``).
        user: User the completion runs for.
        models: Mapping of model id to model dict.
        extra_params: Extra values merged into the parameters given to ``get_tools``.

    Returns:
        ``(body, {})`` when no tool ids are set, the model returns no content,
        or it names an unknown tool; otherwise ``(body, {"sources": [...]})``.
        ``body["metadata"]["files"]`` is removed when the called tool sets
        ``file_handler``.

    Raises:
        Exception: errors from task-model lookup, ``get_tools``, or
            ``process_pipeline_inlet_filter`` propagate. Errors while
            generating or parsing the tool call are logged and swallowed.
    """

    async def get_content_from_response(response) -> Optional[str]:
        content = None
        if hasattr(response, "body_iterator"):
            # Streaming-style response: the last chunk read wins.
            async for chunk in response.body_iterator:
                data = json.loads(chunk.decode("utf-8"))
                content = data["choices"][0]["message"]["content"]

            # Cleanup any remaining background tasks if necessary
            if response.background is not None:
                await response.background()
        else:
            content = response["choices"][0]["message"]["content"]
        return content

    def get_tools_function_calling_payload(messages, task_model_id, content):
        user_message = get_last_user_message(messages)
        # Up to four most recent messages, newest first.
        history = "\n".join(
            f"{message['role'].upper()}: \"\"\"{message['content']}\"\"\""
            for message in messages[::-1][:4]
        )

        prompt = f"History:\n{history}\nQuery: {user_message}"

        return {
            "model": task_model_id,
            "messages": [
                {"role": "system", "content": content},
                {"role": "user", "content": f"Query: {prompt}"},
            ],
            "stream": False,
            "metadata": {"task": str(TASKS.FUNCTION_CALLING)},
        }

    # If tool_ids field is present, call the functions
    metadata = body.get("metadata", {})

    tool_ids = metadata.get("tool_ids", None)
    log.debug(f"{tool_ids=}")
    if not tool_ids:
        return body, {}

    skip_files = False
    sources = []

    task_model_id = get_task_model_id(
        body["model"],
        request.app.state.config.TASK_MODEL,
        request.app.state.config.TASK_MODEL_EXTERNAL,
        models,
    )
    tools = get_tools(
        request,
        tool_ids,
        user,
        {
            **extra_params,
            "__model__": models[task_model_id],
            "__messages__": body["messages"],
            "__files__": metadata.get("files", []),
        },
    )
    log.info(f"{tools=}")

    specs = [tool["spec"] for tool in tools.values()]
    tools_specs = json.dumps(specs)

    if app.state.config.TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE != "":
        template = app.state.config.TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE
    else:
        template = """Available Tools: {{TOOLS}}\nReturn an empty string if no tools match the query. If a function tool matches, construct and return a JSON object in the format {\"name\": \"functionName\", \"parameters\": {\"requiredFunctionParamKey\": \"requiredFunctionParamValue\"}} using the appropriate tool and its parameters. Only return the object and limit the response to the JSON object without additional text."""

    tools_function_calling_prompt = tools_function_calling_generation_template(
        template, tools_specs
    )
    log.info(f"{tools_function_calling_prompt=}")
    payload = get_tools_function_calling_payload(
        body["messages"], task_model_id, tools_function_calling_prompt
    )

    # Errors from the pipeline inlet filter propagate to the caller.
    payload = process_pipeline_inlet_filter(request, payload, user, models)

    try:
        response = await generate_chat_completions(form_data=payload, user=user)
        log.debug(f"{response=}")
        content = await get_content_from_response(response)
        log.debug(f"{content=}")

        if not content:
            return body, {}

        try:
            # Keep only the outermost {...} span of the reply.
            content = content[content.find("{") : content.rfind("}") + 1]
            if not content:
                raise Exception("No JSON object found in the response")

            result = json.loads(content)

            tool_function_name = result.get("name", None)
            if tool_function_name not in tools:
                return body, {}

            tool = tools[tool_function_name]
            # "parameters" may be missing or null in the model's reply.
            tool_function_params = result.get("parameters") or {}

            try:
                parameters_spec = tool.get("spec", {}).get("parameters", {})
                # Accept every declared parameter, not only the required ones,
                # so optional arguments supplied by the model are not dropped.
                # NOTE(review): assumes the spec lists declared parameters
                # under "properties" (JSON Schema style) — confirm against the
                # tool spec generator. Without that key this is the
                # required-only filter.
                allowed_params = set(parameters_spec.get("required", [])) | set(
                    parameters_spec.get("properties", {})
                )
                tool_function = tool["callable"]
                tool_function_params = {
                    k: v
                    for k, v in tool_function_params.items()
                    if k in allowed_params
                }
                tool_output = await tool_function(**tool_function_params)

            except Exception as e:
                # A failing tool reports its error text as the output.
                tool_output = str(e)

            if isinstance(tool_output, str):
                tool_source = f"TOOL:{tool['toolkit_id']}/{tool_function_name}"
                sources.append(
                    {
                        # Only tools with citation enabled get a named source.
                        "source": {"name": tool_source} if tool["citation"] else {},
                        "document": [tool_output],
                        "metadata": [{"source": tool_source}],
                    }
                )

                if tool["file_handler"]:
                    skip_files = True

        except Exception as e:
            log.exception(f"Error: {e}")
    except Exception as e:
        log.exception(f"Error: {e}")

    log.debug(f"tool_contexts: {sources}")

    if skip_files and "files" in body.get("metadata", {}):
        del body["metadata"]["files"]

    return body, {"sources": sources}
async def chat_completion_files_handler(
    request: Request, body: dict, user: UserModel
) -> tuple[dict, dict[str, list]]:
    """Collect retrieval sources for the files attached to a chat request.

    When ``body["metadata"]["files"]`` is set, retrieval queries are generated
    via ``generate_queries``; if that fails or yields nothing, the last user
    message is used as the single query. The queries are then passed to
    ``get_sources_from_files``.

    Args:
        request: Incoming request; retrieval settings are read from
            ``request.app.state``.
        body: Chat completion payload (reads "metadata", "model", "messages").
        user: User on whose behalf the queries are generated.

    Returns:
        ``(body, {"sources": sources})``; ``sources`` is empty when the
        request has no files.
    """
    sources = []

    if files := body.get("metadata", {}).get("files", None):
        try:
            queries_response = await generate_queries(
                {
                    "model": body["model"],
                    "messages": body["messages"],
                    "type": "retrieval",
                },
                user,
            )
            queries_response = queries_response["choices"][0]["message"]["content"]

            try:
                bracket_start = queries_response.find("{")
                bracket_end = queries_response.rfind("}") + 1

                # rfind() returns -1 when "}" is missing, so after the +1 the
                # "not found" value is 0 (never -1). Also reject a "}" that
                # precedes the first "{": slicing would give an empty string
                # and the fallback below would then search for "".
                if bracket_start == -1 or bracket_end <= bracket_start:
                    raise ValueError("No JSON object found in the response")

                queries_response = queries_response[bracket_start:bracket_end]
                queries_response = json.loads(queries_response)
            except Exception:
                # Best effort: treat the text itself as the single query.
                queries_response = {"queries": [queries_response]}

            queries = queries_response.get("queries", [])
        except Exception:
            # Query generation is optional; fall back to the user's message.
            queries = []

        if len(queries) == 0:
            queries = [get_last_user_message(body["messages"])]

        sources = get_sources_from_files(
            files=files,
            queries=queries,
            embedding_function=request.app.state.EMBEDDING_FUNCTION,
            k=request.app.state.config.TOP_K,
            reranking_function=request.app.state.rf,
            r=request.app.state.config.RELEVANCE_THRESHOLD,
            hybrid_search=request.app.state.config.ENABLE_RAG_HYBRID_SEARCH,
        )

        log.debug(f"rag_contexts:sources: {sources}")

    return body, {"sources": sources}
class ChatCompletionMiddleware(BaseHTTPMiddleware):
    """Pre-process chat completion requests and prepend sources to streams.

    Applies to POST requests whose path contains "/ollama/api/chat" or
    "/chat/completions". The JSON body is parsed, model access is checked for
    users with the "user" role, then the filter-function, tool and file
    handlers run. Collected sources are rendered into the messages through the
    RAG template and the rewritten body is forwarded downstream. If the
    downstream response is an event-stream / ndjson ``StreamingResponse``, the
    named sources are emitted as the first stream item.

    All failures are reported by returning a ``JSONResponse``; nothing is
    raised from ``dispatch`` for request-level errors.
    """

    async def dispatch(self, request: Request, call_next):
        if not (
            request.method == "POST"
            and any(
                endpoint in request.url.path
                for endpoint in ["/ollama/api/chat", "/chat/completions"]
            )
        ):
            return await call_next(request)
        log.debug(f"request.url.path: {request.url.path}")

        await get_all_models(request)
        models = app.state.MODELS

        async def get_body_and_model_and_user(request, models):
            # Read the original request body
            body = await request.body()
            body_str = body.decode("utf-8")
            body = json.loads(body_str) if body_str else {}

            model_id = body["model"]
            if model_id not in models:
                raise Exception("Model not found")
            model = models[model_id]

            user = get_current_user(
                request,
                get_http_authorization_cred(request.headers.get("Authorization")),
            )

            return body, model, user

        try:
            body, model, user = await get_body_and_model_and_user(request, models)
        except Exception as e:
            return JSONResponse(
                status_code=status.HTTP_400_BAD_REQUEST,
                content={"detail": str(e)},
            )

        model_info = Models.get_model_by_id(model["id"])
        if user.role == "user" and not BYPASS_MODEL_ACCESS_CONTROL:
            if model.get("arena"):
                if not has_access(
                    user.id,
                    type="read",
                    access_control=model.get("info", {})
                    .get("meta", {})
                    .get("access_control", {}),
                ):
                    # Return the response directly, like the branches below,
                    # instead of raising HTTPException from the middleware.
                    return JSONResponse(
                        status_code=status.HTTP_403_FORBIDDEN,
                        content={"detail": "Model not found"},
                    )
            else:
                if not model_info:
                    return JSONResponse(
                        status_code=status.HTTP_404_NOT_FOUND,
                        content={"detail": "Model not found"},
                    )
                elif not (
                    user.id == model_info.user_id
                    or has_access(
                        user.id, type="read", access_control=model_info.access_control
                    )
                ):
                    return JSONResponse(
                        status_code=status.HTTP_403_FORBIDDEN,
                        content={"detail": "User does not have access to the model"},
                    )

        metadata = {
            "chat_id": body.pop("chat_id", None),
            "message_id": body.pop("id", None),
            "session_id": body.pop("session_id", None),
            "tool_ids": body.get("tool_ids", None),
            "files": body.get("files", None),
        }
        body["metadata"] = metadata

        extra_params = {
            "__event_emitter__": get_event_emitter(metadata),
            "__event_call__": get_event_call(metadata),
            "__user__": {
                "id": user.id,
                "email": user.email,
                "name": user.name,
                "role": user.role,
            },
            "__metadata__": metadata,
        }

        # data_items holds extra items sent to the client ahead of the stream;
        # sources accumulates tool and file contexts.
        data_items = []
        sources = []

        try:
            body, flags = await chat_completion_filter_functions_handler(
                body, model, extra_params
            )
        except Exception as e:
            return JSONResponse(
                status_code=status.HTTP_400_BAD_REQUEST,
                content={"detail": str(e)},
            )

        # Filters may have changed tool_ids/files, so re-read them and move
        # them out of the top-level body into the metadata.
        tool_ids = body.pop("tool_ids", None)
        files = body.pop("files", None)

        metadata = {
            **metadata,
            "tool_ids": tool_ids,
            "files": files,
        }
        body["metadata"] = metadata

        # Tool and file handling are best effort: failures are logged and the
        # request continues without their sources.
        try:
            body, flags = await chat_completion_tools_handler(
                request, body, user, models, extra_params
            )
            sources.extend(flags.get("sources", []))
        except Exception as e:
            log.exception(e)

        try:
            body, flags = await chat_completion_files_handler(request, body, user)
            sources.extend(flags.get("sources", []))
        except Exception as e:
            log.exception(e)

        # If context is not empty, insert it into the messages
        if len(sources) > 0:
            context_parts = []
            for source in sources:
                source_id = source.get("source", {}).get("name", "")
                if "document" not in source:
                    continue

                # Named doc_metadata so the request-level `metadata` above is
                # not rebound inside the loop.
                doc_metadata = source.get("metadata")
                for doc_idx, doc_context in enumerate(source["document"]):
                    doc_source_id = None
                    # Guard the index: a metadata list shorter than the
                    # document list must not abort the request.
                    if doc_metadata and doc_idx < len(doc_metadata):
                        doc_source_id = doc_metadata[doc_idx].get("source", source_id)

                    if source_id:
                        context_parts.append(
                            f"<source><source_id>{doc_source_id if doc_source_id is not None else source_id}</source_id><source_context>{doc_context}</source_context></source>\n"
                        )
                    else:
                        # If there is no source_id, then do not include the source_id tag
                        context_parts.append(
                            f"<source><source_context>{doc_context}</source_context></source>\n"
                        )

            context_string = "".join(context_parts).strip()
            prompt = get_last_user_message(body["messages"])

            if prompt is None:
                return JSONResponse(
                    status_code=status.HTTP_400_BAD_REQUEST,
                    content={"detail": "No user message found"},
                )
            if app.state.config.RELEVANCE_THRESHOLD == 0 and context_string == "":
                log.debug(
                    "With a 0 relevancy threshold for RAG, the context cannot be empty"
                )

            # Workaround for Ollama 2.0+ system prompt issue
            # TODO: replace with add_or_update_system_message
            if model["owned_by"] == "ollama":
                body["messages"] = prepend_to_first_user_message_content(
                    rag_template(app.state.config.RAG_TEMPLATE, context_string, prompt),
                    body["messages"],
                )
            else:
                body["messages"] = add_or_update_system_message(
                    rag_template(app.state.config.RAG_TEMPLATE, context_string, prompt),
                    body["messages"],
                )

        # Only sources that carry a name are sent to the client as citations
        sources = [
            source for source in sources if source.get("source", {}).get("name", "")
        ]
        if len(sources) > 0:
            data_items.append({"sources": sources})

        modified_body_bytes = json.dumps(body).encode("utf-8")
        # Replace the request body with the modified one
        request._body = modified_body_bytes
        # Set custom header to ensure content-length matches new body length
        request.headers.__dict__["_list"] = [
            (b"content-length", str(len(modified_body_bytes)).encode("utf-8")),
            *[(k, v) for k, v in request.headers.raw if k.lower() != b"content-length"],
        ]

        response = await call_next(request)
        if not isinstance(response, StreamingResponse):
            return response

        # A missing Content-Type is treated as "not a chat stream".
        content_type = response.headers.get("Content-Type", "")
        is_openai = "text/event-stream" in content_type
        is_ollama = "application/x-ndjson" in content_type
        if not is_openai and not is_ollama:
            return response

        def wrap_item(item):
            return f"data: {item}\n\n" if is_openai else f"{item}\n"

        async def stream_wrapper(original_generator, data_items):
            # Emit the extra items first, then relay the original stream.
            for item in data_items:
                yield wrap_item(json.dumps(item))

            async for data in original_generator:
                yield data

        return StreamingResponse(
            stream_wrapper(response.body_iterator, data_items),
            headers=dict(response.headers),
        )

    async def _receive(self, body: bytes):
        return {"type": "http.request", "body": body, "more_body": False}


app.add_middleware(ChatCompletionMiddleware)
class PipelineMiddleware(BaseHTTPMiddleware):
    """Run the pipeline inlet filter over chat completion request bodies.

    Applies to POST requests whose path contains "/ollama/api/chat" or
    "/chat/completions". The JSON body is parsed, the caller is authenticated,
    ``process_pipeline_inlet_filter`` is applied, and the possibly modified
    body is forwarded downstream. Errors are returned as ``JSONResponse``.
    """

    async def dispatch(self, request: Request, call_next):
        if not (
            request.method == "POST"
            and any(
                endpoint in request.url.path
                for endpoint in ["/ollama/api/chat", "/chat/completions"]
            )
        ):
            return await call_next(request)

        log.debug(f"request.url.path: {request.url.path}")

        # Read the original request body
        body = await request.body()
        try:
            # Decode body to string
            body_str = body.decode("utf-8")
            # Parse string to JSON
            data = json.loads(body_str) if body_str else {}
        except ValueError as e:
            # UnicodeDecodeError and json.JSONDecodeError are both ValueError
            # subclasses; report a malformed body as a client error.
            return JSONResponse(
                status_code=status.HTTP_400_BAD_REQUEST,
                content={"detail": f"Invalid JSON request body: {e}"},
            )

        try:
            user = get_current_user(
                request,
                get_http_authorization_cred(request.headers["Authorization"]),
            )
        except KeyError as e:
            # A missing Authorization header raises a one-argument KeyError,
            # which takes the 401 branch.
            # NOTE(review): the two-argument form looks like a
            # (status_code, detail) convention -- confirm against the raisers.
            if len(e.args) > 1:
                return JSONResponse(
                    status_code=e.args[0],
                    content={"detail": e.args[1]},
                )
            else:
                return JSONResponse(
                    status_code=status.HTTP_401_UNAUTHORIZED,
                    content={"detail": "Not authenticated"},
                )
        except HTTPException as e:
            return JSONResponse(
                status_code=e.status_code,
                content={"detail": e.detail},
            )

        await get_all_models(request)
        models = app.state.MODELS

        try:
            data = process_pipeline_inlet_filter(request, data, user, models)
        except Exception as e:
            if len(e.args) > 1:
                return JSONResponse(
                    status_code=e.args[0],
                    content={"detail": e.args[1]},
                )
            else:
                return JSONResponse(
                    status_code=status.HTTP_400_BAD_REQUEST,
                    content={"detail": str(e)},
                )

        modified_body_bytes = json.dumps(data).encode("utf-8")
        # Replace the request body with the modified one
        request._body = modified_body_bytes
        # Set custom header to ensure content-length matches new body length
        request.headers.__dict__["_list"] = [
            (b"content-length", str(len(modified_body_bytes)).encode("utf-8")),
            *[(k, v) for k, v in request.headers.raw if k.lower() != b"content-length"],
        ]

        response = await call_next(request)
        return response

    async def _receive(self, body: bytes):
        return {"type": "http.request", "body": body, "more_body": False}


app.add_middleware(PipelineMiddleware)
class RedirectMiddleware(BaseHTTPMiddleware):
    """Redirect GET ``.../watch?v=<id>`` requests to ``/?youtube=<id>``."""

    async def dispatch(self, request: Request, call_next):
        # Only GET requests are candidates for the redirect.
        if request.method != "GET":
            return await call_next(request)

        params = dict(parse_qs(urlparse(str(request.url)).query))
        is_watch_url = request.url.path.endswith("/watch") and "v" in params
        if not is_watch_url:
            # Everything else goes through untouched.
            return await call_next(request)

        # parse_qs maps each key to a list; use the first 'v' value.
        target_query = urlencode({"youtube": params["v"][0]})
        return RedirectResponse(url=f"/?{target_query}")


# Add the middleware to the app
app.add_middleware(RedirectMiddleware)
app.add_middleware(SecurityHeadersMiddleware)
@app.middleware("http")
async def commit_session_after_request(request: Request, call_next):
    """Commit ``Session`` once the downstream handlers have produced a response."""
    downstream_response = await call_next(request)
    Session.commit()
    return downstream_response
@app.middleware("http")
async def check_url(request: Request, call_next):
    """Expose the API-key setting on the request and time the request.

    Copies ``ENABLE_API_KEY`` from the app config onto ``request.state`` and
    sets an ``X-Process-Time`` response header holding the elapsed time in
    whole seconds.
    """
    began = int(time.time())
    request.state.enable_api_key = app.state.config.ENABLE_API_KEY

    response = await call_next(request)

    elapsed_seconds = int(time.time()) - began
    response.headers["X-Process-Time"] = str(elapsed_seconds)
    return response
@app.middleware("http")
async def inspect_websocket(request: Request, call_next):
    """Reject socket.io websocket requests that lack valid upgrade headers.

    Applies to paths containing "/ws/socket.io" with ``transport=websocket``.
    Such a request must carry ``Upgrade: websocket`` and an ``upgrade`` token
    in ``Connection``; otherwise a 400 response is returned.
    """
    if (
        "/ws/socket.io" in request.url.path
        and request.query_params.get("transport") == "websocket"
    ):
        upgrade = (request.headers.get("Upgrade") or "").strip().lower()
        # Connection is a comma-separated token list, commonly written with a
        # space after the comma ("keep-alive, Upgrade"), so each token must be
        # stripped before comparing.
        connection = {
            token.strip()
            for token in (request.headers.get("Connection") or "").lower().split(",")
        }
        # Check that there's the correct headers for an upgrade, else reject the connection
        # This is to work around this upstream issue: https://github.com/miguelgrinberg/python-engineio/issues/367
        if upgrade != "websocket" or "upgrade" not in connection:
            return JSONResponse(
                status_code=status.HTTP_400_BAD_REQUEST,
                content={"detail": "Invalid WebSocket upgrade request"},
            )
    return await call_next(request)
app.add_middleware(
    CORSMiddleware,
    allow_origins=CORS_ALLOW_ORIGIN,
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

app.mount("/ws", socket_app)

# (router, URL prefix, OpenAPI tag) triples, registered in the listed order.
for _router, _prefix, _tag in (
    (ollama.router, "/ollama", "ollama"),
    (openai.router, "/openai", "openai"),
    (pipelines.router, "/api/v1/pipelines", "pipelines"),
    (tasks.router, "/api/v1/tasks", "tasks"),
    (images.router, "/api/v1/images", "images"),
    (audio.router, "/api/v1/audio", "audio"),
    (retrieval.router, "/api/v1/retrieval", "retrieval"),
    (configs.router, "/api/v1/configs", "configs"),
    (auths.router, "/api/v1/auths", "auths"),
    (users.router, "/api/v1/users", "users"),
    (chats.router, "/api/v1/chats", "chats"),
    (models.router, "/api/v1/models", "models"),
    (knowledge.router, "/api/v1/knowledge", "knowledge"),
    (prompts.router, "/api/v1/prompts", "prompts"),
    (tools.router, "/api/v1/tools", "tools"),
    (memories.router, "/api/v1/memories", "memories"),
    (folders.router, "/api/v1/folders", "folders"),
    (groups.router, "/api/v1/groups", "groups"),
    (files.router, "/api/v1/files", "files"),
    (functions.router, "/api/v1/functions", "functions"),
    (evaluations.router, "/api/v1/evaluations", "evaluations"),
    (utils.router, "/api/v1/utils", "utils"),
):
    app.include_router(_router, prefix=_prefix, tags=[_tag])
- ##################################
- #
- # Chat Endpoints
- #
- ##################################
@app.get("/api/models")
async def get_models(request: Request, user=Depends(get_verified_user)):
    # Lists the models for the caller: filter pipelines are dropped, the
    # configured MODEL_ORDER_LIST ordering is applied, and for "user"-role
    # callers (unless access control is bypassed) only readable models remain.

    def user_can_read(model):
        # Arena models carry their access control in info.meta.
        if model.get("arena"):
            return has_access(
                user.id,
                type="read",
                access_control=model.get("info", {})
                .get("meta", {})
                .get("access_control", {}),
            )

        # Other models need a stored record that the user owns or can read.
        record = Models.get_model_by_id(model["id"])
        if not record:
            return False
        return user.id == record.user_id or has_access(
            user.id, type="read", access_control=record.access_control
        )

    available = await get_all_models(request)

    # Filter out filter pipelines
    models = []
    for candidate in available:
        is_filter_pipeline = (
            "pipeline" in candidate
            and candidate["pipeline"].get("type", None) == "filter"
        )
        if not is_filter_pipeline:
            models.append(candidate)

    order_list = request.app.state.config.MODEL_ORDER_LIST
    if order_list:
        rank = {model_id: position for position, model_id in enumerate(order_list)}

        def sort_key(model):
            # Listed models first (by list position), the rest by name.
            return (rank.get(model["id"], float("inf")), model["name"])

        models.sort(key=sort_key)

    # Filter out models that the user does not have access to
    if user.role == "user" and not BYPASS_MODEL_ACCESS_CONTROL:
        models = [model for model in models if user_can_read(model)]

    log.debug(
        f"/api/models returned filtered models accessible to the user: {json.dumps([model['id'] for model in models])}"
    )

    return {"data": models}
@app.get("/api/models/base")
async def get_base_models(request: Request, user=Depends(get_admin_user)):
    # Admin-only: returns whatever get_all_base_models yields, wrapped in "data".
    base_models = await get_all_base_models(request)
    return dict(data=base_models)
@app.post("/api/chat/completions")
async def chat_completion(
    request: Request,
    form_data: dict,
    user=Depends(get_verified_user),
    bypass_filter: bool = False,
):
    # Delegates to chat_completion_handler. An HTTPException raised by the
    # handler is passed through unchanged so its status code and detail reach
    # the client; any other error is reported as a 400 carrying its message.
    try:
        return await chat_completion_handler(request, form_data, user, bypass_filter)
    except HTTPException:
        raise
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_400_BAD_REQUEST,
            detail=str(e),
        ) from e


# Aliases under which the same coroutine is referenced elsewhere in this file.
generate_chat_completions = chat_completion
generate_chat_completion = chat_completion
@app.post("/api/chat/completed")
async def chat_completed(
    request: Request, form_data: dict, user=Depends(get_verified_user)
):
    # Delegates to chat_completed_handler. An HTTPException raised by the
    # handler is passed through unchanged; any other error is reported as a
    # 400 carrying its message.
    try:
        return await chat_completed_handler(request, form_data, user)
    except HTTPException:
        raise
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_400_BAD_REQUEST,
            detail=str(e),
        ) from e
@app.post("/api/chat/actions/{action_id}")
async def chat_action(
    request: Request, action_id: str, form_data: dict, user=Depends(get_verified_user)
):
    # Delegates to chat_action_handler for the given action_id. An
    # HTTPException raised by the handler is passed through unchanged; any
    # other error is reported as a 400 carrying its message.
    try:
        return await chat_action_handler(request, action_id, form_data, user)
    except HTTPException:
        raise
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_400_BAD_REQUEST,
            detail=str(e),
        ) from e
- ##################################
- #
- # Config Endpoints
- #
- ##################################
@app.get("/api/config")
async def get_app_config(request: Request):
    # Returns the public app configuration. Callers identified through the
    # "token" cookie additionally receive the extended feature flags and
    # defaults; an undecodable token yields a 401.
    user = None
    if "token" in request.cookies:
        try:
            claims = decode_token(request.cookies.get("token"))
        except Exception as e:
            log.debug(e)
            raise HTTPException(
                status_code=status.HTTP_401_UNAUTHORIZED,
                detail="Invalid token",
            )
        if claims is not None and "id" in claims:
            user = Users.get_user_by_id(claims["id"])

    signed_in = user is not None

    # Onboarding is flagged only for anonymous callers while no users exist;
    # the user count is not queried for signed-in callers.
    onboarding = (not signed_in) and Users.get_num_users() == 0

    features = {
        "auth": WEBUI_AUTH,
        "auth_trusted_header": bool(app.state.AUTH_TRUSTED_EMAIL_HEADER),
        "enable_ldap": app.state.config.ENABLE_LDAP,
        "enable_api_key": app.state.config.ENABLE_API_KEY,
        "enable_signup": app.state.config.ENABLE_SIGNUP,
        "enable_login_form": app.state.config.ENABLE_LOGIN_FORM,
    }
    if signed_in:
        features.update(
            {
                "enable_web_search": app.state.config.ENABLE_RAG_WEB_SEARCH,
                "enable_image_generation": app.state.config.ENABLE_IMAGE_GENERATION,
                "enable_community_sharing": app.state.config.ENABLE_COMMUNITY_SHARING,
                "enable_message_rating": app.state.config.ENABLE_MESSAGE_RATING,
                "enable_admin_export": ENABLE_ADMIN_EXPORT,
                "enable_admin_chat_access": ENABLE_ADMIN_CHAT_ACCESS,
            }
        )

    # Keys are inserted in the same order as the response has always used.
    config_response = {}
    if onboarding:
        config_response["onboarding"] = True

    config_response.update(
        {
            "status": True,
            "name": WEBUI_NAME,
            "version": VERSION,
            "default_locale": str(DEFAULT_LOCALE),
            "oauth": {
                "providers": {
                    name: config.get("name", name)
                    for name, config in OAUTH_PROVIDERS.items()
                }
            },
            "features": features,
        }
    )

    if signed_in:
        config_response.update(
            {
                "default_models": app.state.config.DEFAULT_MODELS,
                "default_prompt_suggestions": app.state.config.DEFAULT_PROMPT_SUGGESTIONS,
                "audio": {
                    "tts": {
                        "engine": app.state.config.TTS_ENGINE,
                        "voice": app.state.config.TTS_VOICE,
                        "split_on": app.state.config.TTS_SPLIT_ON,
                    },
                    "stt": {
                        "engine": app.state.config.STT_ENGINE,
                    },
                },
                "file": {
                    "max_size": app.state.config.FILE_MAX_SIZE,
                    "max_count": app.state.config.FILE_MAX_COUNT,
                },
                "permissions": {**app.state.config.USER_PERMISSIONS},
            }
        )

    return config_response
class UrlForm(BaseModel):
    # Request body with a single URL string; update_webhook_url reads `url`.
    url: str
@app.get("/api/webhook")
async def get_webhook_url(user=Depends(get_admin_user)):
    # Admin-only: reports the webhook URL currently stored in the app config.
    current_url = app.state.config.WEBHOOK_URL
    return {"url": current_url}
@app.post("/api/webhook")
async def update_webhook_url(form_data: UrlForm, user=Depends(get_admin_user)):
    # Admin-only: stores the submitted URL in the app config, mirrors the
    # stored value onto app.state.WEBHOOK_URL, and returns the stored value.
    config = app.state.config
    config.WEBHOOK_URL = form_data.url
    # Read the value back from the config rather than reusing form_data.url.
    app.state.WEBHOOK_URL = config.WEBHOOK_URL
    return {"url": config.WEBHOOK_URL}
@app.get("/api/version")
async def get_app_version():
    # Reports the running application version.
    return dict(version=VERSION)
@app.get("/api/version/updates")
async def get_app_latest_release_version():
    # Reports the current version alongside the latest GitHub release tag.
    # In offline mode, or when the lookup fails for any reason (including the
    # 1-second total timeout), the current version is reported as the latest.
    if OFFLINE_MODE:
        log.debug(
            "Offline mode is enabled, returning current version as latest version"
        )
        return {"current": VERSION, "latest": VERSION}
    try:
        timeout = aiohttp.ClientTimeout(total=1)
        async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
            async with session.get(
                "https://api.github.com/repos/open-webui/open-webui/releases/latest"
            ) as response:
                response.raise_for_status()
                data = await response.json()
                latest_version = data["tag_name"]

                # Drop a leading "v" only when it is present, so a tag
                # published without the prefix does not lose its first digit.
                return {"current": VERSION, "latest": latest_version.removeprefix("v")}
    except Exception as e:
        log.debug(e)
        return {"current": VERSION, "latest": VERSION}
@app.get("/api/changelog")
async def get_app_changelog():
    # Returns the first five CHANGELOG entries in their stored order.
    first_entries = list(CHANGELOG.items())[:5]
    return dict(first_entries)
############################
# OAuth Login & Callback
############################

# authlib's OAuth flow relies on SessionMiddleware, so it is registered only
# when at least one OAuth provider is configured.
if OAUTH_PROVIDERS:
    app.add_middleware(
        SessionMiddleware,
        secret_key=WEBUI_SECRET_KEY,
        session_cookie="oui-session",
        same_site=WEBUI_SESSION_COOKIE_SAME_SITE,
        https_only=WEBUI_SESSION_COOKIE_SECURE,
    )
@app.get("/oauth/{provider}/login")
async def oauth_login(provider: str, request: Request):
    # Hands the login request for the given provider to the OAuth manager.
    login_response = await oauth_manager.handle_login(provider, request)
    return login_response
# How an OAuth login is resolved:
# 1. Look for a user whose subject ID matches and is tied to the provider
# 2. With OAUTH_MERGE_ACCOUNTS_BY_EMAIL enabled, look for a user by the email address supplied via OAuth
#    - Generally considered insecure, because OAuth providers do not always verify email addresses
# 3. If no user was found and ENABLE_OAUTH_SIGNUP is enabled, create one
#    - Email addresses are treated as unique, so registration fails if the address is already taken
@app.get("/oauth/{provider}/callback")
async def oauth_callback(provider: str, request: Request, response: Response):
    # Hands the provider callback to the OAuth manager.
    callback_result = await oauth_manager.handle_callback(provider, request, response)
    return callback_result
@app.get("/manifest.json")
async def get_manifest_json():
    # Builds the web app manifest; both icon entries use the same logo and
    # differ only in their "purpose".
    def logo_icon(purpose):
        return {
            "src": "/static/logo.png",
            "type": "image/png",
            "sizes": "500x500",
            "purpose": purpose,
        }

    manifest = {
        "name": WEBUI_NAME,
        "short_name": WEBUI_NAME,
        "description": "Open WebUI is an open, extensible, user-friendly interface for AI that adapts to your workflow.",
        "start_url": "/",
        "display": "standalone",
        "background_color": "#343541",
        "orientation": "natural",
        "icons": [logo_icon(purpose) for purpose in ("any", "maskable")],
    }
    return manifest
@app.get("/opensearch.xml")
async def get_opensearch_xml():
    # Serves the OpenSearch description document for this instance.
    # WEBUI_NAME and WEBUI_URL are XML-escaped so that characters such as
    # "&" or "<" in either value cannot produce a malformed document.
    from xml.sax.saxutils import escape

    name = escape(str(WEBUI_NAME))
    # The URL is also used inside a double-quoted attribute, so quotes are
    # escaped as well.
    base_url = escape(str(WEBUI_URL), {'"': "&quot;"})

    xml_content = f"""
    <OpenSearchDescription xmlns="http://a9.com/-/spec/opensearch/1.1/" xmlns:moz="http://www.mozilla.org/2006/browser/search/">
    <ShortName>{name}</ShortName>
    <Description>Search {name}</Description>
    <InputEncoding>UTF-8</InputEncoding>
    <Image width="16" height="16" type="image/x-icon">{base_url}/static/favicon.png</Image>
    <Url type="text/html" method="get" template="{base_url}/?q={{searchTerms}}"/>
    <moz:SearchForm>{base_url}</moz:SearchForm>
    </OpenSearchDescription>
    """
    return Response(content=xml_content, media_type="application/xml")
@app.get("/health")
async def healthcheck():
    # Liveness probe: always answers with a true status.
    return dict(status=True)
@app.get("/health/db")
async def healthcheck_with_db():
    # Runs a trivial query through Session before answering; a failing query
    # propagates as an error instead of a true status.
    probe = Session.execute(text("SELECT 1;"))
    probe.all()
    return dict(status=True)
app.mount("/static", StaticFiles(directory=STATIC_DIR), name="static")
app.mount("/cache", StaticFiles(directory=CACHE_DIR), name="cache")

# The SPA frontend is mounted only when its build output exists; otherwise
# the application serves the API alone.
if not os.path.exists(FRONTEND_BUILD_DIR):
    log.warning(
        f"Frontend build directory not found at '{FRONTEND_BUILD_DIR}'. Serving API only."
    )
else:
    mimetypes.add_type("text/javascript", ".js")
    app.mount(
        "/",
        SPAStaticFiles(directory=FRONTEND_BUILD_DIR, html=True),
        name="spa-static-files",
    )
|