main.py 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217
  1. from bs4 import BeautifulSoup
  2. import json
  3. import markdown
  4. import time
  5. import os
  6. import sys
  7. import requests
  8. from fastapi import FastAPI, Request, Depends, status
  9. from fastapi.staticfiles import StaticFiles
  10. from fastapi import HTTPException
  11. from fastapi.middleware.wsgi import WSGIMiddleware
  12. from fastapi.middleware.cors import CORSMiddleware
  13. from starlette.exceptions import HTTPException as StarletteHTTPException
  14. from starlette.middleware.base import BaseHTTPMiddleware
  15. from apps.ollama.main import app as ollama_app
  16. from apps.openai.main import app as openai_app
  17. from apps.litellm.main import app as litellm_app, startup as litellm_app_startup
  18. from apps.audio.main import app as audio_app
  19. from apps.images.main import app as images_app
  20. from apps.rag.main import app as rag_app
  21. from apps.web.main import app as webui_app
  22. from apps.rag.utils import query_doc, query_collection, rag_template
  23. from config import WEBUI_NAME, ENV, VERSION, CHANGELOG, FRONTEND_BUILD_DIR
  24. from constants import ERROR_MESSAGES
  25. class SPAStaticFiles(StaticFiles):
  26. async def get_response(self, path: str, scope):
  27. try:
  28. return await super().get_response(path, scope)
  29. except (HTTPException, StarletteHTTPException) as ex:
  30. if ex.status_code == 404:
  31. return await super().get_response("index.html", scope)
  32. else:
  33. raise ex
  34. app = FastAPI(docs_url="/docs" if ENV == "dev" else None, redoc_url=None)
  35. origins = ["*"]
  36. app.add_middleware(
  37. CORSMiddleware,
  38. allow_origins=origins,
  39. allow_credentials=True,
  40. allow_methods=["*"],
  41. allow_headers=["*"],
  42. )
  43. @app.on_event("startup")
  44. async def on_startup():
  45. await litellm_app_startup()
  46. class RAGMiddleware(BaseHTTPMiddleware):
  47. async def dispatch(self, request: Request, call_next):
  48. print(request.url.path)
  49. if request.method == "POST":
  50. # Read the original request body
  51. body = await request.body()
  52. # Decode body to string
  53. body_str = body.decode("utf-8")
  54. # Parse string to JSON
  55. data = json.loads(body_str) if body_str else {}
  56. # Example: Add a new key-value pair or modify existing ones
  57. # data["modified"] = True # Example modification
  58. if "docs" in data:
  59. docs = data["docs"]
  60. print(docs)
  61. last_user_message_idx = None
  62. for i in range(len(data["messages"]) - 1, -1, -1):
  63. if data["messages"][i]["role"] == "user":
  64. last_user_message_idx = i
  65. break
  66. query = data["messages"][last_user_message_idx]["content"]
  67. relevant_contexts = []
  68. for doc in docs:
  69. context = None
  70. if doc["type"] == "collection":
  71. context = query_collection(
  72. collection_names=doc["collection_names"],
  73. query=query,
  74. k=rag_app.state.TOP_K,
  75. embedding_function=rag_app.state.sentence_transformer_ef,
  76. )
  77. else:
  78. context = query_doc(
  79. collection_name=doc["collection_name"],
  80. query=query,
  81. k=rag_app.state.TOP_K,
  82. embedding_function=rag_app.state.sentence_transformer_ef,
  83. )
  84. relevant_contexts.append(context)
  85. context_string = ""
  86. for context in relevant_contexts:
  87. if context:
  88. context_string += " ".join(context["documents"][0]) + "\n"
  89. content = rag_template(
  90. template=rag_app.state.RAG_TEMPLATE,
  91. context=context_string,
  92. query=query,
  93. )
  94. new_user_message = {
  95. **data["messages"][last_user_message_idx],
  96. "content": content,
  97. }
  98. data["messages"][last_user_message_idx] = new_user_message
  99. del data["docs"]
  100. print("DATAAAAAAAAAAAAAAAAAA")
  101. print(data)
  102. modified_body_bytes = json.dumps(data).encode("utf-8")
  103. # Create a new request with the modified body
  104. scope = request.scope
  105. scope["body"] = modified_body_bytes
  106. request = Request(scope, receive=lambda: self._receive(modified_body_bytes))
  107. response = await call_next(request)
  108. return response
  109. async def _receive(self, body: bytes):
  110. return {"type": "http.request", "body": body, "more_body": False}
  111. app.add_middleware(RAGMiddleware)
  112. @app.middleware("http")
  113. async def check_url(request: Request, call_next):
  114. start_time = int(time.time())
  115. response = await call_next(request)
  116. process_time = int(time.time()) - start_time
  117. response.headers["X-Process-Time"] = str(process_time)
  118. return response
  119. app.mount("/api/v1", webui_app)
  120. app.mount("/litellm/api", litellm_app)
  121. app.mount("/ollama", ollama_app)
  122. app.mount("/openai/api", openai_app)
  123. app.mount("/images/api/v1", images_app)
  124. app.mount("/audio/api/v1", audio_app)
  125. app.mount("/rag/api/v1", rag_app)
  126. @app.get("/api/config")
  127. async def get_app_config():
  128. return {
  129. "status": True,
  130. "name": WEBUI_NAME,
  131. "version": VERSION,
  132. "images": images_app.state.ENABLED,
  133. "default_models": webui_app.state.DEFAULT_MODELS,
  134. "default_prompt_suggestions": webui_app.state.DEFAULT_PROMPT_SUGGESTIONS,
  135. }
  136. @app.get("/api/version")
  137. async def get_app_config():
  138. return {
  139. "version": VERSION,
  140. }
  141. @app.get("/api/changelog")
  142. async def get_app_changelog():
  143. return CHANGELOG
  144. @app.get("/api/version/updates")
  145. async def get_app_latest_release_version():
  146. try:
  147. response = requests.get(
  148. f"https://api.github.com/repos/open-webui/open-webui/releases/latest"
  149. )
  150. response.raise_for_status()
  151. latest_version = response.json()["tag_name"]
  152. return {"current": VERSION, "latest": latest_version[1:]}
  153. except Exception as e:
  154. raise HTTPException(
  155. status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
  156. detail=ERROR_MESSAGES.RATE_LIMIT_EXCEEDED,
  157. )
  158. app.mount("/static", StaticFiles(directory="static"), name="static")
  159. app.mount("/cache", StaticFiles(directory="data/cache"), name="cache")
  160. app.mount(
  161. "/",
  162. SPAStaticFiles(directory=FRONTEND_BUILD_DIR, html=True),
  163. name="spa-static-files",
  164. )