# config.py
import importlib.metadata
import json
import logging
import os
import pkgutil
import shutil
import sys
from base64 import b64encode
from pathlib import Path
from secrets import token_bytes
from typing import TypeVar, Generic, Union

import chromadb
import markdown
import requests
import yaml
from bs4 import BeautifulSoup
from chromadb import Settings

from constants import ERROR_MESSAGES
  19. ####################################
  20. # Load .env file
  21. ####################################
  22. BACKEND_DIR = Path(__file__).parent # the path containing this file
  23. BASE_DIR = BACKEND_DIR.parent # the path containing the backend/
  24. try:
  25. from dotenv import load_dotenv, find_dotenv
  26. load_dotenv(find_dotenv(str(BASE_DIR / ".env")))
  27. except ImportError:
  28. print("dotenv not installed, skipping...")
  29. ####################################
  30. # LOGGING
  31. ####################################
  32. log_levels = ["CRITICAL", "ERROR", "WARNING", "INFO", "DEBUG"]
  33. GLOBAL_LOG_LEVEL = os.environ.get("GLOBAL_LOG_LEVEL", "").upper()
  34. if GLOBAL_LOG_LEVEL in log_levels:
  35. logging.basicConfig(stream=sys.stdout, level=GLOBAL_LOG_LEVEL, force=True)
  36. else:
  37. GLOBAL_LOG_LEVEL = "INFO"
  38. log = logging.getLogger(__name__)
  39. log.info(f"GLOBAL_LOG_LEVEL: {GLOBAL_LOG_LEVEL}")
  40. log_sources = [
  41. "AUDIO",
  42. "COMFYUI",
  43. "CONFIG",
  44. "DB",
  45. "IMAGES",
  46. "LITELLM",
  47. "MAIN",
  48. "MODELS",
  49. "OLLAMA",
  50. "OPENAI",
  51. "RAG",
  52. "WEBHOOK",
  53. ]
  54. SRC_LOG_LEVELS = {}
  55. for source in log_sources:
  56. log_env_var = source + "_LOG_LEVEL"
  57. SRC_LOG_LEVELS[source] = os.environ.get(log_env_var, "").upper()
  58. if SRC_LOG_LEVELS[source] not in log_levels:
  59. SRC_LOG_LEVELS[source] = GLOBAL_LOG_LEVEL
  60. log.info(f"{log_env_var}: {SRC_LOG_LEVELS[source]}")
  61. log.setLevel(SRC_LOG_LEVELS["CONFIG"])
  62. WEBUI_NAME = os.environ.get("WEBUI_NAME", "Open WebUI")
  63. if WEBUI_NAME != "Open WebUI":
  64. WEBUI_NAME += " (Open WebUI)"
  65. WEBUI_URL = os.environ.get("WEBUI_URL", "http://localhost:3000")
  66. WEBUI_FAVICON_URL = "https://openwebui.com/favicon.png"
  67. ####################################
  68. # ENV (dev,test,prod)
  69. ####################################
  70. ENV = os.environ.get("ENV", "dev")
  71. try:
  72. PACKAGE_DATA = json.loads((BASE_DIR / "package.json").read_text())
  73. except:
  74. try:
  75. PACKAGE_DATA = {"version": importlib.metadata.version("open-webui")}
  76. except importlib.metadata.PackageNotFoundError:
  77. PACKAGE_DATA = {"version": "0.0.0"}
  78. VERSION = PACKAGE_DATA["version"]
  79. # Function to parse each section
  80. def parse_section(section):
  81. items = []
  82. for li in section.find_all("li"):
  83. # Extract raw HTML string
  84. raw_html = str(li)
  85. # Extract text without HTML tags
  86. text = li.get_text(separator=" ", strip=True)
  87. # Split into title and content
  88. parts = text.split(": ", 1)
  89. title = parts[0].strip() if len(parts) > 1 else ""
  90. content = parts[1].strip() if len(parts) > 1 else text
  91. items.append({"title": title, "content": content, "raw": raw_html})
  92. return items
  93. try:
  94. changelog_content = (BASE_DIR / "CHANGELOG.md").read_text()
  95. except:
  96. changelog_content = (pkgutil.get_data("open_webui", "CHANGELOG.md") or b"").decode()
  97. # Convert markdown content to HTML
  98. html_content = markdown.markdown(changelog_content)
  99. # Parse the HTML content
  100. soup = BeautifulSoup(html_content, "html.parser")
  101. # Initialize JSON structure
  102. changelog_json = {}
  103. # Iterate over each version
  104. for version in soup.find_all("h2"):
  105. version_number = version.get_text().strip().split(" - ")[0][1:-1] # Remove brackets
  106. date = version.get_text().strip().split(" - ")[1]
  107. version_data = {"date": date}
  108. # Find the next sibling that is a h3 tag (section title)
  109. current = version.find_next_sibling()
  110. while current and current.name != "h2":
  111. if current.name == "h3":
  112. section_title = current.get_text().lower() # e.g., "added", "fixed"
  113. section_items = parse_section(current.find_next_sibling("ul"))
  114. version_data[section_title] = section_items
  115. # Move to the next element
  116. current = current.find_next_sibling()
  117. changelog_json[version_number] = version_data
  118. CHANGELOG = changelog_json
  119. ####################################
  120. # WEBUI_BUILD_HASH
  121. ####################################
  122. WEBUI_BUILD_HASH = os.environ.get("WEBUI_BUILD_HASH", "dev-build")
  123. ####################################
  124. # DATA/FRONTEND BUILD DIR
  125. ####################################
  126. DATA_DIR = Path(os.getenv("DATA_DIR", BACKEND_DIR / "data")).resolve()
  127. FRONTEND_BUILD_DIR = Path(os.getenv("FRONTEND_BUILD_DIR", BASE_DIR / "build")).resolve()
  128. try:
  129. CONFIG_DATA = json.loads((DATA_DIR / "config.json").read_text())
  130. except:
  131. CONFIG_DATA = {}
  132. ####################################
  133. # Config helpers
  134. ####################################
  135. def save_config():
  136. try:
  137. with open(f"{DATA_DIR}/config.json", "w") as f:
  138. json.dump(CONFIG_DATA, f, indent="\t")
  139. except Exception as e:
  140. log.exception(e)
  141. def get_config_value(config_path: str):
  142. path_parts = config_path.split(".")
  143. cur_config = CONFIG_DATA
  144. for key in path_parts:
  145. if key in cur_config:
  146. cur_config = cur_config[key]
  147. else:
  148. return None
  149. return cur_config
  150. T = TypeVar("T")
  151. class PersistentConfig(Generic[T]):
  152. def __init__(self, env_name: str, config_path: str, env_value: T):
  153. self.env_name = env_name
  154. self.config_path = config_path
  155. self.env_value = env_value
  156. self.config_value = get_config_value(config_path)
  157. if self.config_value is not None:
  158. log.info(f"'{env_name}' loaded from config.json")
  159. self.value = self.config_value
  160. else:
  161. self.value = env_value
  162. def __str__(self):
  163. return str(self.value)
  164. @property
  165. def __dict__(self):
  166. raise TypeError(
  167. "PersistentConfig object cannot be converted to dict, use config_get or .value instead."
  168. )
  169. def __getattribute__(self, item):
  170. if item == "__dict__":
  171. raise TypeError(
  172. "PersistentConfig object cannot be converted to dict, use config_get or .value instead."
  173. )
  174. return super().__getattribute__(item)
  175. def save(self):
  176. # Don't save if the value is the same as the env value and the config value
  177. if self.env_value == self.value:
  178. if self.config_value == self.value:
  179. return
  180. log.info(f"Saving '{self.env_name}' to config.json")
  181. path_parts = self.config_path.split(".")
  182. config = CONFIG_DATA
  183. for key in path_parts[:-1]:
  184. if key not in config:
  185. config[key] = {}
  186. config = config[key]
  187. config[path_parts[-1]] = self.value
  188. save_config()
  189. self.config_value = self.value
  190. class AppConfig:
  191. _state: dict[str, PersistentConfig]
  192. def __init__(self):
  193. super().__setattr__("_state", {})
  194. def __setattr__(self, key, value):
  195. if isinstance(value, PersistentConfig):
  196. self._state[key] = value
  197. else:
  198. self._state[key].value = value
  199. self._state[key].save()
  200. def __getattr__(self, key):
  201. return self._state[key].value
  202. ####################################
  203. # WEBUI_AUTH (Required for security)
  204. ####################################
  205. WEBUI_AUTH = os.environ.get("WEBUI_AUTH", "True").lower() == "true"
  206. WEBUI_AUTH_TRUSTED_EMAIL_HEADER = os.environ.get(
  207. "WEBUI_AUTH_TRUSTED_EMAIL_HEADER", None
  208. )
  209. JWT_EXPIRES_IN = PersistentConfig(
  210. "JWT_EXPIRES_IN", "auth.jwt_expiry", os.environ.get("JWT_EXPIRES_IN", "-1")
  211. )
  212. ####################################
  213. # Static DIR
  214. ####################################
  215. STATIC_DIR = Path(os.getenv("STATIC_DIR", BACKEND_DIR / "static")).resolve()
  216. frontend_favicon = FRONTEND_BUILD_DIR / "favicon.png"
  217. if frontend_favicon.exists():
  218. shutil.copyfile(frontend_favicon, STATIC_DIR / "favicon.png")
  219. else:
  220. logging.warning(f"Frontend favicon not found at {frontend_favicon}")
  221. ####################################
  222. # CUSTOM_NAME
  223. ####################################
  224. CUSTOM_NAME = os.environ.get("CUSTOM_NAME", "")
  225. if CUSTOM_NAME:
  226. try:
  227. r = requests.get(f"https://api.openwebui.com/api/v1/custom/{CUSTOM_NAME}")
  228. data = r.json()
  229. if r.ok:
  230. if "logo" in data:
  231. WEBUI_FAVICON_URL = url = (
  232. f"https://api.openwebui.com{data['logo']}"
  233. if data["logo"][0] == "/"
  234. else data["logo"]
  235. )
  236. r = requests.get(url, stream=True)
  237. if r.status_code == 200:
  238. with open(f"{STATIC_DIR}/favicon.png", "wb") as f:
  239. r.raw.decode_content = True
  240. shutil.copyfileobj(r.raw, f)
  241. WEBUI_NAME = data["name"]
  242. except Exception as e:
  243. log.exception(e)
  244. pass
  245. ####################################
  246. # File Upload DIR
  247. ####################################
  248. UPLOAD_DIR = f"{DATA_DIR}/uploads"
  249. Path(UPLOAD_DIR).mkdir(parents=True, exist_ok=True)
  250. ####################################
  251. # Cache DIR
  252. ####################################
  253. CACHE_DIR = f"{DATA_DIR}/cache"
  254. Path(CACHE_DIR).mkdir(parents=True, exist_ok=True)
  255. ####################################
  256. # Docs DIR
  257. ####################################
  258. DOCS_DIR = os.getenv("DOCS_DIR", f"{DATA_DIR}/docs")
  259. Path(DOCS_DIR).mkdir(parents=True, exist_ok=True)
  260. ####################################
  261. # LITELLM_CONFIG
  262. ####################################
  263. def create_config_file(file_path):
  264. directory = os.path.dirname(file_path)
  265. # Check if directory exists, if not, create it
  266. if not os.path.exists(directory):
  267. os.makedirs(directory)
  268. # Data to write into the YAML file
  269. config_data = {
  270. "general_settings": {},
  271. "litellm_settings": {},
  272. "model_list": [],
  273. "router_settings": {},
  274. }
  275. # Write data to YAML file
  276. with open(file_path, "w") as file:
  277. yaml.dump(config_data, file)
  278. LITELLM_CONFIG_PATH = f"{DATA_DIR}/litellm/config.yaml"
  279. if not os.path.exists(LITELLM_CONFIG_PATH):
  280. log.info("Config file doesn't exist. Creating...")
  281. create_config_file(LITELLM_CONFIG_PATH)
  282. log.info("Config file created successfully.")
  283. ####################################
  284. # OLLAMA_BASE_URL
  285. ####################################
  286. ENABLE_OLLAMA_API = PersistentConfig(
  287. "ENABLE_OLLAMA_API",
  288. "ollama.enable",
  289. os.environ.get("ENABLE_OLLAMA_API", "True").lower() == "true",
  290. )
  291. OLLAMA_API_BASE_URL = os.environ.get(
  292. "OLLAMA_API_BASE_URL", "http://localhost:11434/api"
  293. )
  294. OLLAMA_BASE_URL = os.environ.get("OLLAMA_BASE_URL", "")
  295. K8S_FLAG = os.environ.get("K8S_FLAG", "")
  296. USE_OLLAMA_DOCKER = os.environ.get("USE_OLLAMA_DOCKER", "false")
  297. if OLLAMA_BASE_URL == "" and OLLAMA_API_BASE_URL != "":
  298. OLLAMA_BASE_URL = (
  299. OLLAMA_API_BASE_URL[:-4]
  300. if OLLAMA_API_BASE_URL.endswith("/api")
  301. else OLLAMA_API_BASE_URL
  302. )
  303. if ENV == "prod":
  304. if OLLAMA_BASE_URL == "/ollama" and not K8S_FLAG:
  305. if USE_OLLAMA_DOCKER.lower() == "true":
  306. # if you use all-in-one docker container (Open WebUI + Ollama)
  307. # with the docker build arg USE_OLLAMA=true (--build-arg="USE_OLLAMA=true") this only works with http://localhost:11434
  308. OLLAMA_BASE_URL = "http://localhost:11434"
  309. else:
  310. OLLAMA_BASE_URL = "http://host.docker.internal:11434"
  311. elif K8S_FLAG:
  312. OLLAMA_BASE_URL = "http://ollama-service.open-webui.svc.cluster.local:11434"
  313. OLLAMA_BASE_URLS = os.environ.get("OLLAMA_BASE_URLS", "")
  314. OLLAMA_BASE_URLS = OLLAMA_BASE_URLS if OLLAMA_BASE_URLS != "" else OLLAMA_BASE_URL
  315. OLLAMA_BASE_URLS = [url.strip() for url in OLLAMA_BASE_URLS.split(";")]
  316. OLLAMA_BASE_URLS = PersistentConfig(
  317. "OLLAMA_BASE_URLS", "ollama.base_urls", OLLAMA_BASE_URLS
  318. )
  319. ####################################
  320. # OPENAI_API
  321. ####################################
  322. ENABLE_OPENAI_API = PersistentConfig(
  323. "ENABLE_OPENAI_API",
  324. "openai.enable",
  325. os.environ.get("ENABLE_OPENAI_API", "True").lower() == "true",
  326. )
  327. OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY", "")
  328. OPENAI_API_BASE_URL = os.environ.get("OPENAI_API_BASE_URL", "")
  329. if OPENAI_API_BASE_URL == "":
  330. OPENAI_API_BASE_URL = "https://api.openai.com/v1"
  331. OPENAI_API_KEYS = os.environ.get("OPENAI_API_KEYS", "")
  332. OPENAI_API_KEYS = OPENAI_API_KEYS if OPENAI_API_KEYS != "" else OPENAI_API_KEY
  333. OPENAI_API_KEYS = [url.strip() for url in OPENAI_API_KEYS.split(";")]
  334. OPENAI_API_KEYS = PersistentConfig(
  335. "OPENAI_API_KEYS", "openai.api_keys", OPENAI_API_KEYS
  336. )
  337. OPENAI_API_BASE_URLS = os.environ.get("OPENAI_API_BASE_URLS", "")
  338. OPENAI_API_BASE_URLS = (
  339. OPENAI_API_BASE_URLS if OPENAI_API_BASE_URLS != "" else OPENAI_API_BASE_URL
  340. )
  341. OPENAI_API_BASE_URLS = [
  342. url.strip() if url != "" else "https://api.openai.com/v1"
  343. for url in OPENAI_API_BASE_URLS.split(";")
  344. ]
  345. OPENAI_API_BASE_URLS = PersistentConfig(
  346. "OPENAI_API_BASE_URLS", "openai.api_base_urls", OPENAI_API_BASE_URLS
  347. )
  348. OPENAI_API_KEY = ""
  349. try:
  350. OPENAI_API_KEY = OPENAI_API_KEYS.value[
  351. OPENAI_API_BASE_URLS.value.index("https://api.openai.com/v1")
  352. ]
  353. except:
  354. pass
  355. OPENAI_API_BASE_URL = "https://api.openai.com/v1"
  356. ####################################
  357. # WEBUI
  358. ####################################
  359. ENABLE_SIGNUP = PersistentConfig(
  360. "ENABLE_SIGNUP",
  361. "ui.enable_signup",
  362. (
  363. False
  364. if not WEBUI_AUTH
  365. else os.environ.get("ENABLE_SIGNUP", "True").lower() == "true"
  366. ),
  367. )
  368. DEFAULT_MODELS = PersistentConfig(
  369. "DEFAULT_MODELS", "ui.default_models", os.environ.get("DEFAULT_MODELS", None)
  370. )
  371. DEFAULT_PROMPT_SUGGESTIONS = PersistentConfig(
  372. "DEFAULT_PROMPT_SUGGESTIONS",
  373. "ui.prompt_suggestions",
  374. [
  375. {
  376. "title": ["Help me study", "vocabulary for a college entrance exam"],
  377. "content": "Help me study vocabulary: write a sentence for me to fill in the blank, and I'll try to pick the correct option.",
  378. },
  379. {
  380. "title": ["Give me ideas", "for what to do with my kids' art"],
  381. "content": "What are 5 creative things I could do with my kids' art? I don't want to throw them away, but it's also so much clutter.",
  382. },
  383. {
  384. "title": ["Tell me a fun fact", "about the Roman Empire"],
  385. "content": "Tell me a random fun fact about the Roman Empire",
  386. },
  387. {
  388. "title": ["Show me a code snippet", "of a website's sticky header"],
  389. "content": "Show me a code snippet of a website's sticky header in CSS and JavaScript.",
  390. },
  391. {
  392. "title": [
  393. "Explain options trading",
  394. "if I'm familiar with buying and selling stocks",
  395. ],
  396. "content": "Explain options trading in simple terms if I'm familiar with buying and selling stocks.",
  397. },
  398. {
  399. "title": ["Overcome procrastination", "give me tips"],
  400. "content": "Could you start by asking me about instances when I procrastinate the most and then give me some suggestions to overcome it?",
  401. },
  402. ],
  403. )
  404. DEFAULT_USER_ROLE = PersistentConfig(
  405. "DEFAULT_USER_ROLE",
  406. "ui.default_user_role",
  407. os.getenv("DEFAULT_USER_ROLE", "pending"),
  408. )
  409. USER_PERMISSIONS_CHAT_DELETION = (
  410. os.environ.get("USER_PERMISSIONS_CHAT_DELETION", "True").lower() == "true"
  411. )
  412. USER_PERMISSIONS = PersistentConfig(
  413. "USER_PERMISSIONS",
  414. "ui.user_permissions",
  415. {"chat": {"deletion": USER_PERMISSIONS_CHAT_DELETION}},
  416. )
  417. ENABLE_MODEL_FILTER = PersistentConfig(
  418. "ENABLE_MODEL_FILTER",
  419. "model_filter.enable",
  420. os.environ.get("ENABLE_MODEL_FILTER", "False").lower() == "true",
  421. )
  422. MODEL_FILTER_LIST = os.environ.get("MODEL_FILTER_LIST", "")
  423. MODEL_FILTER_LIST = PersistentConfig(
  424. "MODEL_FILTER_LIST",
  425. "model_filter.list",
  426. [model.strip() for model in MODEL_FILTER_LIST.split(";")],
  427. )
  428. WEBHOOK_URL = PersistentConfig(
  429. "WEBHOOK_URL", "webhook_url", os.environ.get("WEBHOOK_URL", "")
  430. )
  431. ENABLE_ADMIN_EXPORT = os.environ.get("ENABLE_ADMIN_EXPORT", "True").lower() == "true"
  432. ####################################
  433. # WEBUI_SECRET_KEY
  434. ####################################
  435. WEBUI_SECRET_KEY = os.environ.get(
  436. "WEBUI_SECRET_KEY",
  437. os.environ.get(
  438. "WEBUI_JWT_SECRET_KEY", "t0p-s3cr3t"
  439. ), # DEPRECATED: remove at next major version
  440. )
  441. if WEBUI_AUTH and WEBUI_SECRET_KEY == "":
  442. raise ValueError(ERROR_MESSAGES.ENV_VAR_NOT_FOUND)
  443. ####################################
  444. # RAG
  445. ####################################
  446. CHROMA_DATA_PATH = f"{DATA_DIR}/vector_db"
  447. CHROMA_TENANT = os.environ.get("CHROMA_TENANT", chromadb.DEFAULT_TENANT)
  448. CHROMA_DATABASE = os.environ.get("CHROMA_DATABASE", chromadb.DEFAULT_DATABASE)
  449. CHROMA_HTTP_HOST = os.environ.get("CHROMA_HTTP_HOST", "")
  450. CHROMA_HTTP_PORT = int(os.environ.get("CHROMA_HTTP_PORT", "8000"))
  451. # Comma-separated list of header=value pairs
  452. CHROMA_HTTP_HEADERS = os.environ.get("CHROMA_HTTP_HEADERS", "")
  453. if CHROMA_HTTP_HEADERS:
  454. CHROMA_HTTP_HEADERS = dict(
  455. [pair.split("=") for pair in CHROMA_HTTP_HEADERS.split(",")]
  456. )
  457. else:
  458. CHROMA_HTTP_HEADERS = None
  459. CHROMA_HTTP_SSL = os.environ.get("CHROMA_HTTP_SSL", "false").lower() == "true"
  460. # this uses the model defined in the Dockerfile ENV variable. If you dont use docker or docker based deployments such as k8s, the default embedding model will be used (sentence-transformers/all-MiniLM-L6-v2)
  461. RAG_TOP_K = PersistentConfig(
  462. "RAG_TOP_K", "rag.top_k", int(os.environ.get("RAG_TOP_K", "5"))
  463. )
  464. RAG_RELEVANCE_THRESHOLD = PersistentConfig(
  465. "RAG_RELEVANCE_THRESHOLD",
  466. "rag.relevance_threshold",
  467. float(os.environ.get("RAG_RELEVANCE_THRESHOLD", "0.0")),
  468. )
  469. ENABLE_RAG_HYBRID_SEARCH = PersistentConfig(
  470. "ENABLE_RAG_HYBRID_SEARCH",
  471. "rag.enable_hybrid_search",
  472. os.environ.get("ENABLE_RAG_HYBRID_SEARCH", "").lower() == "true",
  473. )
  474. ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION = PersistentConfig(
  475. "ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION",
  476. "rag.enable_web_loader_ssl_verification",
  477. os.environ.get("ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION", "True").lower() == "true",
  478. )
  479. RAG_EMBEDDING_ENGINE = PersistentConfig(
  480. "RAG_EMBEDDING_ENGINE",
  481. "rag.embedding_engine",
  482. os.environ.get("RAG_EMBEDDING_ENGINE", ""),
  483. )
  484. PDF_EXTRACT_IMAGES = PersistentConfig(
  485. "PDF_EXTRACT_IMAGES",
  486. "rag.pdf_extract_images",
  487. os.environ.get("PDF_EXTRACT_IMAGES", "False").lower() == "true",
  488. )
  489. RAG_EMBEDDING_MODEL = PersistentConfig(
  490. "RAG_EMBEDDING_MODEL",
  491. "rag.embedding_model",
  492. os.environ.get("RAG_EMBEDDING_MODEL", "sentence-transformers/all-MiniLM-L6-v2"),
  493. )
  494. log.info(f"Embedding model set: {RAG_EMBEDDING_MODEL.value}"),
  495. RAG_EMBEDDING_MODEL_AUTO_UPDATE = (
  496. os.environ.get("RAG_EMBEDDING_MODEL_AUTO_UPDATE", "").lower() == "true"
  497. )
  498. RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE = (
  499. os.environ.get("RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE", "").lower() == "true"
  500. )
  501. RAG_RERANKING_MODEL = PersistentConfig(
  502. "RAG_RERANKING_MODEL",
  503. "rag.reranking_model",
  504. os.environ.get("RAG_RERANKING_MODEL", ""),
  505. )
  506. if RAG_RERANKING_MODEL.value != "":
  507. log.info(f"Reranking model set: {RAG_RERANKING_MODEL.value}"),
  508. RAG_RERANKING_MODEL_AUTO_UPDATE = (
  509. os.environ.get("RAG_RERANKING_MODEL_AUTO_UPDATE", "").lower() == "true"
  510. )
  511. RAG_RERANKING_MODEL_TRUST_REMOTE_CODE = (
  512. os.environ.get("RAG_RERANKING_MODEL_TRUST_REMOTE_CODE", "").lower() == "true"
  513. )
  514. if CHROMA_HTTP_HOST != "":
  515. CHROMA_CLIENT = chromadb.HttpClient(
  516. host=CHROMA_HTTP_HOST,
  517. port=CHROMA_HTTP_PORT,
  518. headers=CHROMA_HTTP_HEADERS,
  519. ssl=CHROMA_HTTP_SSL,
  520. tenant=CHROMA_TENANT,
  521. database=CHROMA_DATABASE,
  522. settings=Settings(allow_reset=True, anonymized_telemetry=False),
  523. )
  524. else:
  525. CHROMA_CLIENT = chromadb.PersistentClient(
  526. path=CHROMA_DATA_PATH,
  527. settings=Settings(allow_reset=True, anonymized_telemetry=False),
  528. tenant=CHROMA_TENANT,
  529. database=CHROMA_DATABASE,
  530. )
  531. # device type embedding models - "cpu" (default), "cuda" (nvidia gpu required) or "mps" (apple silicon) - choosing this right can lead to better performance
  532. USE_CUDA = os.environ.get("USE_CUDA_DOCKER", "false")
  533. if USE_CUDA.lower() == "true":
  534. DEVICE_TYPE = "cuda"
  535. else:
  536. DEVICE_TYPE = "cpu"
  537. CHUNK_SIZE = PersistentConfig(
  538. "CHUNK_SIZE", "rag.chunk_size", int(os.environ.get("CHUNK_SIZE", "1500"))
  539. )
  540. CHUNK_OVERLAP = PersistentConfig(
  541. "CHUNK_OVERLAP",
  542. "rag.chunk_overlap",
  543. int(os.environ.get("CHUNK_OVERLAP", "100")),
  544. )
  545. DEFAULT_RAG_TEMPLATE = """Use the following context as your learned knowledge, inside <context></context> XML tags.
  546. <context>
  547. [context]
  548. </context>
  549. When answer to user:
  550. - If you don't know, just say that you don't know.
  551. - If you don't know when you are not sure, ask for clarification.
  552. Avoid mentioning that you obtained the information from the context.
  553. And answer according to the language of the user's question.
  554. Given the context information, answer the query.
  555. Query: [query]"""
  556. RAG_TEMPLATE = PersistentConfig(
  557. "RAG_TEMPLATE",
  558. "rag.template",
  559. os.environ.get("RAG_TEMPLATE", DEFAULT_RAG_TEMPLATE),
  560. )
  561. RAG_OPENAI_API_BASE_URL = PersistentConfig(
  562. "RAG_OPENAI_API_BASE_URL",
  563. "rag.openai_api_base_url",
  564. os.getenv("RAG_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  565. )
  566. RAG_OPENAI_API_KEY = PersistentConfig(
  567. "RAG_OPENAI_API_KEY",
  568. "rag.openai_api_key",
  569. os.getenv("RAG_OPENAI_API_KEY", OPENAI_API_KEY),
  570. )
  571. ENABLE_RAG_LOCAL_WEB_FETCH = (
  572. os.getenv("ENABLE_RAG_LOCAL_WEB_FETCH", "False").lower() == "true"
  573. )
  574. YOUTUBE_LOADER_LANGUAGE = PersistentConfig(
  575. "YOUTUBE_LOADER_LANGUAGE",
  576. "rag.youtube_loader_language",
  577. os.getenv("YOUTUBE_LOADER_LANGUAGE", "en").split(","),
  578. )
  579. ####################################
  580. # Transcribe
  581. ####################################
  582. WHISPER_MODEL = os.getenv("WHISPER_MODEL", "base")
  583. WHISPER_MODEL_DIR = os.getenv("WHISPER_MODEL_DIR", f"{CACHE_DIR}/whisper/models")
  584. WHISPER_MODEL_AUTO_UPDATE = (
  585. os.environ.get("WHISPER_MODEL_AUTO_UPDATE", "").lower() == "true"
  586. )
  587. ####################################
  588. # Images
  589. ####################################
  590. IMAGE_GENERATION_ENGINE = PersistentConfig(
  591. "IMAGE_GENERATION_ENGINE",
  592. "image_generation.engine",
  593. os.getenv("IMAGE_GENERATION_ENGINE", ""),
  594. )
  595. ENABLE_IMAGE_GENERATION = PersistentConfig(
  596. "ENABLE_IMAGE_GENERATION",
  597. "image_generation.enable",
  598. os.environ.get("ENABLE_IMAGE_GENERATION", "").lower() == "true",
  599. )
  600. AUTOMATIC1111_BASE_URL = PersistentConfig(
  601. "AUTOMATIC1111_BASE_URL",
  602. "image_generation.automatic1111.base_url",
  603. os.getenv("AUTOMATIC1111_BASE_URL", ""),
  604. )
  605. COMFYUI_BASE_URL = PersistentConfig(
  606. "COMFYUI_BASE_URL",
  607. "image_generation.comfyui.base_url",
  608. os.getenv("COMFYUI_BASE_URL", ""),
  609. )
  610. IMAGES_OPENAI_API_BASE_URL = PersistentConfig(
  611. "IMAGES_OPENAI_API_BASE_URL",
  612. "image_generation.openai.api_base_url",
  613. os.getenv("IMAGES_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  614. )
  615. IMAGES_OPENAI_API_KEY = PersistentConfig(
  616. "IMAGES_OPENAI_API_KEY",
  617. "image_generation.openai.api_key",
  618. os.getenv("IMAGES_OPENAI_API_KEY", OPENAI_API_KEY),
  619. )
  620. IMAGE_SIZE = PersistentConfig(
  621. "IMAGE_SIZE", "image_generation.size", os.getenv("IMAGE_SIZE", "512x512")
  622. )
  623. IMAGE_STEPS = PersistentConfig(
  624. "IMAGE_STEPS", "image_generation.steps", int(os.getenv("IMAGE_STEPS", 50))
  625. )
  626. IMAGE_GENERATION_MODEL = PersistentConfig(
  627. "IMAGE_GENERATION_MODEL",
  628. "image_generation.model",
  629. os.getenv("IMAGE_GENERATION_MODEL", ""),
  630. )
  631. ####################################
  632. # Audio
  633. ####################################
  634. AUDIO_OPENAI_API_BASE_URL = PersistentConfig(
  635. "AUDIO_OPENAI_API_BASE_URL",
  636. "audio.openai.api_base_url",
  637. os.getenv("AUDIO_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  638. )
  639. AUDIO_OPENAI_API_KEY = PersistentConfig(
  640. "AUDIO_OPENAI_API_KEY",
  641. "audio.openai.api_key",
  642. os.getenv("AUDIO_OPENAI_API_KEY", OPENAI_API_KEY),
  643. )
  644. AUDIO_OPENAI_API_MODEL = PersistentConfig(
  645. "AUDIO_OPENAI_API_MODEL",
  646. "audio.openai.api_model",
  647. os.getenv("AUDIO_OPENAI_API_MODEL", "tts-1"),
  648. )
  649. AUDIO_OPENAI_API_VOICE = PersistentConfig(
  650. "AUDIO_OPENAI_API_VOICE",
  651. "audio.openai.api_voice",
  652. os.getenv("AUDIO_OPENAI_API_VOICE", "alloy"),
  653. )
  654. ####################################
  655. # LiteLLM
  656. ####################################
  657. ENABLE_LITELLM = os.environ.get("ENABLE_LITELLM", "True").lower() == "true"
  658. LITELLM_PROXY_PORT = int(os.getenv("LITELLM_PROXY_PORT", "14365"))
  659. if LITELLM_PROXY_PORT < 0 or LITELLM_PROXY_PORT > 65535:
  660. raise ValueError("Invalid port number for LITELLM_PROXY_PORT")
  661. LITELLM_PROXY_HOST = os.getenv("LITELLM_PROXY_HOST", "127.0.0.1")
  662. ####################################
  663. # Database
  664. ####################################
  665. DATABASE_URL = os.environ.get("DATABASE_URL", f"sqlite:///{DATA_DIR}/webui.db")