config.py 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837
  1. import os
  2. import sys
  3. import logging
  4. import importlib.metadata
  5. import pkgutil
  6. import chromadb
  7. from chromadb import Settings
  8. from base64 import b64encode
  9. from bs4 import BeautifulSoup
  10. from typing import TypeVar, Generic, Union
  11. from pathlib import Path
  12. import json
  13. import yaml
  14. import markdown
  15. import requests
  16. import shutil
  17. from secrets import token_bytes
  18. from constants import ERROR_MESSAGES
  19. ####################################
  20. # Load .env file
  21. ####################################
  22. BACKEND_DIR = Path(__file__).parent # the path containing this file
  23. BASE_DIR = BACKEND_DIR.parent # the path containing the backend/
  24. print(BASE_DIR)
  25. try:
  26. from dotenv import load_dotenv, find_dotenv
  27. load_dotenv(find_dotenv(str(BASE_DIR / ".env")))
  28. except ImportError:
  29. print("dotenv not installed, skipping...")
  30. ####################################
  31. # LOGGING
  32. ####################################
  33. log_levels = ["CRITICAL", "ERROR", "WARNING", "INFO", "DEBUG"]
  34. GLOBAL_LOG_LEVEL = os.environ.get("GLOBAL_LOG_LEVEL", "").upper()
  35. if GLOBAL_LOG_LEVEL in log_levels:
  36. logging.basicConfig(stream=sys.stdout, level=GLOBAL_LOG_LEVEL, force=True)
  37. else:
  38. GLOBAL_LOG_LEVEL = "INFO"
  39. log = logging.getLogger(__name__)
  40. log.info(f"GLOBAL_LOG_LEVEL: {GLOBAL_LOG_LEVEL}")
  41. log_sources = [
  42. "AUDIO",
  43. "COMFYUI",
  44. "CONFIG",
  45. "DB",
  46. "IMAGES",
  47. "MAIN",
  48. "MODELS",
  49. "OLLAMA",
  50. "OPENAI",
  51. "RAG",
  52. "WEBHOOK",
  53. ]
  54. SRC_LOG_LEVELS = {}
  55. for source in log_sources:
  56. log_env_var = source + "_LOG_LEVEL"
  57. SRC_LOG_LEVELS[source] = os.environ.get(log_env_var, "").upper()
  58. if SRC_LOG_LEVELS[source] not in log_levels:
  59. SRC_LOG_LEVELS[source] = GLOBAL_LOG_LEVEL
  60. log.info(f"{log_env_var}: {SRC_LOG_LEVELS[source]}")
  61. log.setLevel(SRC_LOG_LEVELS["CONFIG"])
  62. WEBUI_NAME = os.environ.get("WEBUI_NAME", "Open WebUI")
  63. if WEBUI_NAME != "Open WebUI":
  64. WEBUI_NAME += " (Open WebUI)"
  65. WEBUI_URL = os.environ.get("WEBUI_URL", "http://localhost:3000")
  66. WEBUI_FAVICON_URL = "https://openwebui.com/favicon.png"
  67. ####################################
  68. # ENV (dev,test,prod)
  69. ####################################
  70. ENV = os.environ.get("ENV", "dev")
  71. try:
  72. PACKAGE_DATA = json.loads((BASE_DIR / "package.json").read_text())
  73. except:
  74. try:
  75. PACKAGE_DATA = {"version": importlib.metadata.version("open-webui")}
  76. except importlib.metadata.PackageNotFoundError:
  77. PACKAGE_DATA = {"version": "0.0.0"}
  78. VERSION = PACKAGE_DATA["version"]
  79. # Function to parse each section
  80. def parse_section(section):
  81. items = []
  82. for li in section.find_all("li"):
  83. # Extract raw HTML string
  84. raw_html = str(li)
  85. # Extract text without HTML tags
  86. text = li.get_text(separator=" ", strip=True)
  87. # Split into title and content
  88. parts = text.split(": ", 1)
  89. title = parts[0].strip() if len(parts) > 1 else ""
  90. content = parts[1].strip() if len(parts) > 1 else text
  91. items.append({"title": title, "content": content, "raw": raw_html})
  92. return items
  93. try:
  94. with open(BASE_DIR / "CHANGELOG.md", "r") as file:
  95. changelog_content = file.read()
  96. except:
  97. changelog_content = (pkgutil.get_data("open_webui", "CHANGELOG.md") or b"").decode()
  98. # Convert markdown content to HTML
  99. html_content = markdown.markdown(changelog_content)
  100. # Parse the HTML content
  101. soup = BeautifulSoup(html_content, "html.parser")
  102. # Initialize JSON structure
  103. changelog_json = {}
  104. # Iterate over each version
  105. for version in soup.find_all("h2"):
  106. version_number = version.get_text().strip().split(" - ")[0][1:-1] # Remove brackets
  107. date = version.get_text().strip().split(" - ")[1]
  108. version_data = {"date": date}
  109. # Find the next sibling that is a h3 tag (section title)
  110. current = version.find_next_sibling()
  111. while current and current.name != "h2":
  112. if current.name == "h3":
  113. section_title = current.get_text().lower() # e.g., "added", "fixed"
  114. section_items = parse_section(current.find_next_sibling("ul"))
  115. version_data[section_title] = section_items
  116. # Move to the next element
  117. current = current.find_next_sibling()
  118. changelog_json[version_number] = version_data
  119. CHANGELOG = changelog_json
  120. ####################################
  121. # WEBUI_VERSION
  122. ####################################
  123. WEBUI_VERSION = os.environ.get("WEBUI_VERSION", "v1.0.0-alpha.100")
  124. ####################################
  125. # DATA/FRONTEND BUILD DIR
  126. ####################################
  127. DATA_DIR = Path(os.getenv("DATA_DIR", BACKEND_DIR / "data")).resolve()
  128. FRONTEND_BUILD_DIR = Path(os.getenv("FRONTEND_BUILD_DIR", BASE_DIR / "build")).resolve()
  129. try:
  130. CONFIG_DATA = json.loads((DATA_DIR / "config.json").read_text())
  131. except:
  132. CONFIG_DATA = {}
  133. ####################################
  134. # Config helpers
  135. ####################################
  136. def save_config():
  137. try:
  138. with open(f"{DATA_DIR}/config.json", "w") as f:
  139. json.dump(CONFIG_DATA, f, indent="\t")
  140. except Exception as e:
  141. log.exception(e)
  142. def get_config_value(config_path: str):
  143. path_parts = config_path.split(".")
  144. cur_config = CONFIG_DATA
  145. for key in path_parts:
  146. if key in cur_config:
  147. cur_config = cur_config[key]
  148. else:
  149. return None
  150. return cur_config
  151. T = TypeVar("T")
  152. class PersistentConfig(Generic[T]):
  153. def __init__(self, env_name: str, config_path: str, env_value: T):
  154. self.env_name = env_name
  155. self.config_path = config_path
  156. self.env_value = env_value
  157. self.config_value = get_config_value(config_path)
  158. if self.config_value is not None:
  159. log.info(f"'{env_name}' loaded from config.json")
  160. self.value = self.config_value
  161. else:
  162. self.value = env_value
  163. def __str__(self):
  164. return str(self.value)
  165. @property
  166. def __dict__(self):
  167. raise TypeError(
  168. "PersistentConfig object cannot be converted to dict, use config_get or .value instead."
  169. )
  170. def __getattribute__(self, item):
  171. if item == "__dict__":
  172. raise TypeError(
  173. "PersistentConfig object cannot be converted to dict, use config_get or .value instead."
  174. )
  175. return super().__getattribute__(item)
  176. def save(self):
  177. # Don't save if the value is the same as the env value and the config value
  178. if self.env_value == self.value:
  179. if self.config_value == self.value:
  180. return
  181. log.info(f"Saving '{self.env_name}' to config.json")
  182. path_parts = self.config_path.split(".")
  183. config = CONFIG_DATA
  184. for key in path_parts[:-1]:
  185. if key not in config:
  186. config[key] = {}
  187. config = config[key]
  188. config[path_parts[-1]] = self.value
  189. save_config()
  190. self.config_value = self.value
  191. class AppConfig:
  192. _state: dict[str, PersistentConfig]
  193. def __init__(self):
  194. super().__setattr__("_state", {})
  195. def __setattr__(self, key, value):
  196. if isinstance(value, PersistentConfig):
  197. self._state[key] = value
  198. else:
  199. self._state[key].value = value
  200. self._state[key].save()
  201. def __getattr__(self, key):
  202. return self._state[key].value
  203. ####################################
  204. # WEBUI_AUTH (Required for security)
  205. ####################################
  206. WEBUI_AUTH = os.environ.get("WEBUI_AUTH", "True").lower() == "true"
  207. WEBUI_AUTH_TRUSTED_EMAIL_HEADER = os.environ.get(
  208. "WEBUI_AUTH_TRUSTED_EMAIL_HEADER", None
  209. )
  210. JWT_EXPIRES_IN = PersistentConfig(
  211. "JWT_EXPIRES_IN", "auth.jwt_expiry", os.environ.get("JWT_EXPIRES_IN", "-1")
  212. )
  213. ####################################
  214. # Static DIR
  215. ####################################
  216. STATIC_DIR = Path(os.getenv("STATIC_DIR", BACKEND_DIR / "static")).resolve()
  217. frontend_favicon = FRONTEND_BUILD_DIR / "favicon.png"
  218. if frontend_favicon.exists():
  219. shutil.copyfile(frontend_favicon, STATIC_DIR / "favicon.png")
  220. else:
  221. logging.warning(f"Frontend favicon not found at {frontend_favicon}")
  222. ####################################
  223. # CUSTOM_NAME
  224. ####################################
  225. CUSTOM_NAME = os.environ.get("CUSTOM_NAME", "")
  226. if CUSTOM_NAME:
  227. try:
  228. r = requests.get(f"https://api.openwebui.com/api/v1/custom/{CUSTOM_NAME}")
  229. data = r.json()
  230. if r.ok:
  231. if "logo" in data:
  232. WEBUI_FAVICON_URL = url = (
  233. f"https://api.openwebui.com{data['logo']}"
  234. if data["logo"][0] == "/"
  235. else data["logo"]
  236. )
  237. r = requests.get(url, stream=True)
  238. if r.status_code == 200:
  239. with open(f"{STATIC_DIR}/favicon.png", "wb") as f:
  240. r.raw.decode_content = True
  241. shutil.copyfileobj(r.raw, f)
  242. WEBUI_NAME = data["name"]
  243. except Exception as e:
  244. log.exception(e)
  245. pass
  246. ####################################
  247. # File Upload DIR
  248. ####################################
  249. UPLOAD_DIR = f"{DATA_DIR}/uploads"
  250. Path(UPLOAD_DIR).mkdir(parents=True, exist_ok=True)
  251. ####################################
  252. # Cache DIR
  253. ####################################
  254. CACHE_DIR = f"{DATA_DIR}/cache"
  255. Path(CACHE_DIR).mkdir(parents=True, exist_ok=True)
  256. ####################################
  257. # Docs DIR
  258. ####################################
  259. DOCS_DIR = os.getenv("DOCS_DIR", f"{DATA_DIR}/docs")
  260. Path(DOCS_DIR).mkdir(parents=True, exist_ok=True)
  261. ####################################
  262. # LITELLM_CONFIG
  263. ####################################
  264. def create_config_file(file_path):
  265. directory = os.path.dirname(file_path)
  266. # Check if directory exists, if not, create it
  267. if not os.path.exists(directory):
  268. os.makedirs(directory)
  269. # Data to write into the YAML file
  270. config_data = {
  271. "general_settings": {},
  272. "litellm_settings": {},
  273. "model_list": [],
  274. "router_settings": {},
  275. }
  276. # Write data to YAML file
  277. with open(file_path, "w") as file:
  278. yaml.dump(config_data, file)
  279. LITELLM_CONFIG_PATH = f"{DATA_DIR}/litellm/config.yaml"
  280. # if not os.path.exists(LITELLM_CONFIG_PATH):
  281. # log.info("Config file doesn't exist. Creating...")
  282. # create_config_file(LITELLM_CONFIG_PATH)
  283. # log.info("Config file created successfully.")
  284. ####################################
  285. # OLLAMA_BASE_URL
  286. ####################################
  287. ENABLE_OLLAMA_API = PersistentConfig(
  288. "ENABLE_OLLAMA_API",
  289. "ollama.enable",
  290. os.environ.get("ENABLE_OLLAMA_API", "True").lower() == "true",
  291. )
  292. OLLAMA_API_BASE_URL = os.environ.get(
  293. "OLLAMA_API_BASE_URL", "http://localhost:11434/api"
  294. )
  295. OLLAMA_BASE_URL = os.environ.get("OLLAMA_BASE_URL", "")
  296. K8S_FLAG = os.environ.get("K8S_FLAG", "")
  297. USE_OLLAMA_DOCKER = os.environ.get("USE_OLLAMA_DOCKER", "false")
  298. if OLLAMA_BASE_URL == "" and OLLAMA_API_BASE_URL != "":
  299. OLLAMA_BASE_URL = (
  300. OLLAMA_API_BASE_URL[:-4]
  301. if OLLAMA_API_BASE_URL.endswith("/api")
  302. else OLLAMA_API_BASE_URL
  303. )
  304. if ENV == "prod":
  305. if OLLAMA_BASE_URL == "/ollama" and not K8S_FLAG:
  306. if USE_OLLAMA_DOCKER.lower() == "true":
  307. # if you use all-in-one docker container (Open WebUI + Ollama)
  308. # with the docker build arg USE_OLLAMA=true (--build-arg="USE_OLLAMA=true") this only works with http://localhost:11434
  309. OLLAMA_BASE_URL = "http://localhost:11434"
  310. else:
  311. OLLAMA_BASE_URL = "http://host.docker.internal:11434"
  312. elif K8S_FLAG:
  313. OLLAMA_BASE_URL = "http://ollama-service.open-webui.svc.cluster.local:11434"
  314. OLLAMA_BASE_URLS = os.environ.get("OLLAMA_BASE_URLS", "")
  315. OLLAMA_BASE_URLS = OLLAMA_BASE_URLS if OLLAMA_BASE_URLS != "" else OLLAMA_BASE_URL
  316. OLLAMA_BASE_URLS = [url.strip() for url in OLLAMA_BASE_URLS.split(";")]
  317. OLLAMA_BASE_URLS = PersistentConfig(
  318. "OLLAMA_BASE_URLS", "ollama.base_urls", OLLAMA_BASE_URLS
  319. )
  320. ####################################
  321. # OPENAI_API
  322. ####################################
  323. ENABLE_OPENAI_API = PersistentConfig(
  324. "ENABLE_OPENAI_API",
  325. "openai.enable",
  326. os.environ.get("ENABLE_OPENAI_API", "True").lower() == "true",
  327. )
  328. OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY", "")
  329. OPENAI_API_BASE_URL = os.environ.get("OPENAI_API_BASE_URL", "")
  330. if OPENAI_API_BASE_URL == "":
  331. OPENAI_API_BASE_URL = "https://api.openai.com/v1"
  332. OPENAI_API_KEYS = os.environ.get("OPENAI_API_KEYS", "")
  333. OPENAI_API_KEYS = OPENAI_API_KEYS if OPENAI_API_KEYS != "" else OPENAI_API_KEY
  334. OPENAI_API_KEYS = [url.strip() for url in OPENAI_API_KEYS.split(";")]
  335. OPENAI_API_KEYS = PersistentConfig(
  336. "OPENAI_API_KEYS", "openai.api_keys", OPENAI_API_KEYS
  337. )
  338. OPENAI_API_BASE_URLS = os.environ.get("OPENAI_API_BASE_URLS", "")
  339. OPENAI_API_BASE_URLS = (
  340. OPENAI_API_BASE_URLS if OPENAI_API_BASE_URLS != "" else OPENAI_API_BASE_URL
  341. )
  342. OPENAI_API_BASE_URLS = [
  343. url.strip() if url != "" else "https://api.openai.com/v1"
  344. for url in OPENAI_API_BASE_URLS.split(";")
  345. ]
  346. OPENAI_API_BASE_URLS = PersistentConfig(
  347. "OPENAI_API_BASE_URLS", "openai.api_base_urls", OPENAI_API_BASE_URLS
  348. )
  349. OPENAI_API_KEY = ""
  350. try:
  351. OPENAI_API_KEY = OPENAI_API_KEYS.value[
  352. OPENAI_API_BASE_URLS.value.index("https://api.openai.com/v1")
  353. ]
  354. except:
  355. pass
  356. OPENAI_API_BASE_URL = "https://api.openai.com/v1"
  357. ####################################
  358. # WEBUI
  359. ####################################
  360. ENABLE_SIGNUP = PersistentConfig(
  361. "ENABLE_SIGNUP",
  362. "ui.enable_signup",
  363. (
  364. False
  365. if not WEBUI_AUTH
  366. else os.environ.get("ENABLE_SIGNUP", "True").lower() == "true"
  367. ),
  368. )
  369. DEFAULT_MODELS = PersistentConfig(
  370. "DEFAULT_MODELS", "ui.default_models", os.environ.get("DEFAULT_MODELS", None)
  371. )
  372. DEFAULT_PROMPT_SUGGESTIONS = PersistentConfig(
  373. "DEFAULT_PROMPT_SUGGESTIONS",
  374. "ui.prompt_suggestions",
  375. [
  376. {
  377. "title": ["Help me study", "vocabulary for a college entrance exam"],
  378. "content": "Help me study vocabulary: write a sentence for me to fill in the blank, and I'll try to pick the correct option.",
  379. },
  380. {
  381. "title": ["Give me ideas", "for what to do with my kids' art"],
  382. "content": "What are 5 creative things I could do with my kids' art? I don't want to throw them away, but it's also so much clutter.",
  383. },
  384. {
  385. "title": ["Tell me a fun fact", "about the Roman Empire"],
  386. "content": "Tell me a random fun fact about the Roman Empire",
  387. },
  388. {
  389. "title": ["Show me a code snippet", "of a website's sticky header"],
  390. "content": "Show me a code snippet of a website's sticky header in CSS and JavaScript.",
  391. },
  392. {
  393. "title": [
  394. "Explain options trading",
  395. "if I'm familiar with buying and selling stocks",
  396. ],
  397. "content": "Explain options trading in simple terms if I'm familiar with buying and selling stocks.",
  398. },
  399. {
  400. "title": ["Overcome procrastination", "give me tips"],
  401. "content": "Could you start by asking me about instances when I procrastinate the most and then give me some suggestions to overcome it?",
  402. },
  403. ],
  404. )
  405. DEFAULT_USER_ROLE = PersistentConfig(
  406. "DEFAULT_USER_ROLE",
  407. "ui.default_user_role",
  408. os.getenv("DEFAULT_USER_ROLE", "pending"),
  409. )
  410. USER_PERMISSIONS_CHAT_DELETION = (
  411. os.environ.get("USER_PERMISSIONS_CHAT_DELETION", "True").lower() == "true"
  412. )
  413. USER_PERMISSIONS = PersistentConfig(
  414. "USER_PERMISSIONS",
  415. "ui.user_permissions",
  416. {"chat": {"deletion": USER_PERMISSIONS_CHAT_DELETION}},
  417. )
  418. ENABLE_MODEL_FILTER = PersistentConfig(
  419. "ENABLE_MODEL_FILTER",
  420. "model_filter.enable",
  421. os.environ.get("ENABLE_MODEL_FILTER", "False").lower() == "true",
  422. )
  423. MODEL_FILTER_LIST = os.environ.get("MODEL_FILTER_LIST", "")
  424. MODEL_FILTER_LIST = PersistentConfig(
  425. "MODEL_FILTER_LIST",
  426. "model_filter.list",
  427. [model.strip() for model in MODEL_FILTER_LIST.split(";")],
  428. )
  429. WEBHOOK_URL = PersistentConfig(
  430. "WEBHOOK_URL", "webhook_url", os.environ.get("WEBHOOK_URL", "")
  431. )
  432. ENABLE_ADMIN_EXPORT = os.environ.get("ENABLE_ADMIN_EXPORT", "True").lower() == "true"
  433. ####################################
  434. # WEBUI_SECRET_KEY
  435. ####################################
  436. WEBUI_SECRET_KEY = os.environ.get(
  437. "WEBUI_SECRET_KEY",
  438. os.environ.get(
  439. "WEBUI_JWT_SECRET_KEY", "t0p-s3cr3t"
  440. ), # DEPRECATED: remove at next major version
  441. )
  442. if WEBUI_AUTH and WEBUI_SECRET_KEY == "":
  443. raise ValueError(ERROR_MESSAGES.ENV_VAR_NOT_FOUND)
  444. ####################################
  445. # RAG
  446. ####################################
  447. CHROMA_DATA_PATH = f"{DATA_DIR}/vector_db"
  448. CHROMA_TENANT = os.environ.get("CHROMA_TENANT", chromadb.DEFAULT_TENANT)
  449. CHROMA_DATABASE = os.environ.get("CHROMA_DATABASE", chromadb.DEFAULT_DATABASE)
  450. CHROMA_HTTP_HOST = os.environ.get("CHROMA_HTTP_HOST", "")
  451. CHROMA_HTTP_PORT = int(os.environ.get("CHROMA_HTTP_PORT", "8000"))
  452. # Comma-separated list of header=value pairs
  453. CHROMA_HTTP_HEADERS = os.environ.get("CHROMA_HTTP_HEADERS", "")
  454. if CHROMA_HTTP_HEADERS:
  455. CHROMA_HTTP_HEADERS = dict(
  456. [pair.split("=") for pair in CHROMA_HTTP_HEADERS.split(",")]
  457. )
  458. else:
  459. CHROMA_HTTP_HEADERS = None
  460. CHROMA_HTTP_SSL = os.environ.get("CHROMA_HTTP_SSL", "false").lower() == "true"
  461. # this uses the model defined in the Dockerfile ENV variable. If you dont use docker or docker based deployments such as k8s, the default embedding model will be used (sentence-transformers/all-MiniLM-L6-v2)
  462. RAG_TOP_K = PersistentConfig(
  463. "RAG_TOP_K", "rag.top_k", int(os.environ.get("RAG_TOP_K", "5"))
  464. )
  465. RAG_RELEVANCE_THRESHOLD = PersistentConfig(
  466. "RAG_RELEVANCE_THRESHOLD",
  467. "rag.relevance_threshold",
  468. float(os.environ.get("RAG_RELEVANCE_THRESHOLD", "0.0")),
  469. )
  470. ENABLE_RAG_HYBRID_SEARCH = PersistentConfig(
  471. "ENABLE_RAG_HYBRID_SEARCH",
  472. "rag.enable_hybrid_search",
  473. os.environ.get("ENABLE_RAG_HYBRID_SEARCH", "").lower() == "true",
  474. )
  475. ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION = PersistentConfig(
  476. "ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION",
  477. "rag.enable_web_loader_ssl_verification",
  478. os.environ.get("ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION", "True").lower() == "true",
  479. )
  480. RAG_EMBEDDING_ENGINE = PersistentConfig(
  481. "RAG_EMBEDDING_ENGINE",
  482. "rag.embedding_engine",
  483. os.environ.get("RAG_EMBEDDING_ENGINE", ""),
  484. )
  485. PDF_EXTRACT_IMAGES = PersistentConfig(
  486. "PDF_EXTRACT_IMAGES",
  487. "rag.pdf_extract_images",
  488. os.environ.get("PDF_EXTRACT_IMAGES", "False").lower() == "true",
  489. )
  490. RAG_EMBEDDING_MODEL = PersistentConfig(
  491. "RAG_EMBEDDING_MODEL",
  492. "rag.embedding_model",
  493. os.environ.get("RAG_EMBEDDING_MODEL", "sentence-transformers/all-MiniLM-L6-v2"),
  494. )
  495. log.info(f"Embedding model set: {RAG_EMBEDDING_MODEL.value}"),
  496. RAG_EMBEDDING_MODEL_AUTO_UPDATE = (
  497. os.environ.get("RAG_EMBEDDING_MODEL_AUTO_UPDATE", "").lower() == "true"
  498. )
  499. RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE = (
  500. os.environ.get("RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE", "").lower() == "true"
  501. )
  502. RAG_RERANKING_MODEL = PersistentConfig(
  503. "RAG_RERANKING_MODEL",
  504. "rag.reranking_model",
  505. os.environ.get("RAG_RERANKING_MODEL", ""),
  506. )
  507. if RAG_RERANKING_MODEL.value != "":
  508. log.info(f"Reranking model set: {RAG_RERANKING_MODEL.value}"),
  509. RAG_RERANKING_MODEL_AUTO_UPDATE = (
  510. os.environ.get("RAG_RERANKING_MODEL_AUTO_UPDATE", "").lower() == "true"
  511. )
  512. RAG_RERANKING_MODEL_TRUST_REMOTE_CODE = (
  513. os.environ.get("RAG_RERANKING_MODEL_TRUST_REMOTE_CODE", "").lower() == "true"
  514. )
  515. if CHROMA_HTTP_HOST != "":
  516. CHROMA_CLIENT = chromadb.HttpClient(
  517. host=CHROMA_HTTP_HOST,
  518. port=CHROMA_HTTP_PORT,
  519. headers=CHROMA_HTTP_HEADERS,
  520. ssl=CHROMA_HTTP_SSL,
  521. tenant=CHROMA_TENANT,
  522. database=CHROMA_DATABASE,
  523. settings=Settings(allow_reset=True, anonymized_telemetry=False),
  524. )
  525. else:
  526. CHROMA_CLIENT = chromadb.PersistentClient(
  527. path=CHROMA_DATA_PATH,
  528. settings=Settings(allow_reset=True, anonymized_telemetry=False),
  529. tenant=CHROMA_TENANT,
  530. database=CHROMA_DATABASE,
  531. )
  532. # device type embedding models - "cpu" (default), "cuda" (nvidia gpu required) or "mps" (apple silicon) - choosing this right can lead to better performance
  533. USE_CUDA = os.environ.get("USE_CUDA_DOCKER", "false")
  534. if USE_CUDA.lower() == "true":
  535. DEVICE_TYPE = "cuda"
  536. else:
  537. DEVICE_TYPE = "cpu"
  538. CHUNK_SIZE = PersistentConfig(
  539. "CHUNK_SIZE", "rag.chunk_size", int(os.environ.get("CHUNK_SIZE", "1500"))
  540. )
  541. CHUNK_OVERLAP = PersistentConfig(
  542. "CHUNK_OVERLAP",
  543. "rag.chunk_overlap",
  544. int(os.environ.get("CHUNK_OVERLAP", "100")),
  545. )
  546. DEFAULT_RAG_TEMPLATE = """Use the following context as your learned knowledge, inside <context></context> XML tags.
  547. <context>
  548. [context]
  549. </context>
  550. When answer to user:
  551. - If you don't know, just say that you don't know.
  552. - If you don't know when you are not sure, ask for clarification.
  553. Avoid mentioning that you obtained the information from the context.
  554. And answer according to the language of the user's question.
  555. Given the context information, answer the query.
  556. Query: [query]"""
  557. RAG_TEMPLATE = PersistentConfig(
  558. "RAG_TEMPLATE",
  559. "rag.template",
  560. os.environ.get("RAG_TEMPLATE", DEFAULT_RAG_TEMPLATE),
  561. )
  562. RAG_OPENAI_API_BASE_URL = PersistentConfig(
  563. "RAG_OPENAI_API_BASE_URL",
  564. "rag.openai_api_base_url",
  565. os.getenv("RAG_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  566. )
  567. RAG_OPENAI_API_KEY = PersistentConfig(
  568. "RAG_OPENAI_API_KEY",
  569. "rag.openai_api_key",
  570. os.getenv("RAG_OPENAI_API_KEY", OPENAI_API_KEY),
  571. )
  572. ENABLE_RAG_LOCAL_WEB_FETCH = (
  573. os.getenv("ENABLE_RAG_LOCAL_WEB_FETCH", "False").lower() == "true"
  574. )
  575. YOUTUBE_LOADER_LANGUAGE = PersistentConfig(
  576. "YOUTUBE_LOADER_LANGUAGE",
  577. "rag.youtube_loader_language",
  578. os.getenv("YOUTUBE_LOADER_LANGUAGE", "en").split(","),
  579. )
  580. ####################################
  581. # Transcribe
  582. ####################################
  583. WHISPER_MODEL = os.getenv("WHISPER_MODEL", "base")
  584. WHISPER_MODEL_DIR = os.getenv("WHISPER_MODEL_DIR", f"{CACHE_DIR}/whisper/models")
  585. WHISPER_MODEL_AUTO_UPDATE = (
  586. os.environ.get("WHISPER_MODEL_AUTO_UPDATE", "").lower() == "true"
  587. )
  588. ####################################
  589. # Images
  590. ####################################
  591. IMAGE_GENERATION_ENGINE = PersistentConfig(
  592. "IMAGE_GENERATION_ENGINE",
  593. "image_generation.engine",
  594. os.getenv("IMAGE_GENERATION_ENGINE", ""),
  595. )
  596. ENABLE_IMAGE_GENERATION = PersistentConfig(
  597. "ENABLE_IMAGE_GENERATION",
  598. "image_generation.enable",
  599. os.environ.get("ENABLE_IMAGE_GENERATION", "").lower() == "true",
  600. )
  601. AUTOMATIC1111_BASE_URL = PersistentConfig(
  602. "AUTOMATIC1111_BASE_URL",
  603. "image_generation.automatic1111.base_url",
  604. os.getenv("AUTOMATIC1111_BASE_URL", ""),
  605. )
  606. COMFYUI_BASE_URL = PersistentConfig(
  607. "COMFYUI_BASE_URL",
  608. "image_generation.comfyui.base_url",
  609. os.getenv("COMFYUI_BASE_URL", ""),
  610. )
  611. IMAGES_OPENAI_API_BASE_URL = PersistentConfig(
  612. "IMAGES_OPENAI_API_BASE_URL",
  613. "image_generation.openai.api_base_url",
  614. os.getenv("IMAGES_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  615. )
  616. IMAGES_OPENAI_API_KEY = PersistentConfig(
  617. "IMAGES_OPENAI_API_KEY",
  618. "image_generation.openai.api_key",
  619. os.getenv("IMAGES_OPENAI_API_KEY", OPENAI_API_KEY),
  620. )
  621. IMAGE_SIZE = PersistentConfig(
  622. "IMAGE_SIZE", "image_generation.size", os.getenv("IMAGE_SIZE", "512x512")
  623. )
  624. IMAGE_STEPS = PersistentConfig(
  625. "IMAGE_STEPS", "image_generation.steps", int(os.getenv("IMAGE_STEPS", 50))
  626. )
  627. IMAGE_GENERATION_MODEL = PersistentConfig(
  628. "IMAGE_GENERATION_MODEL",
  629. "image_generation.model",
  630. os.getenv("IMAGE_GENERATION_MODEL", ""),
  631. )
  632. ####################################
  633. # Audio
  634. ####################################
  635. AUDIO_OPENAI_API_BASE_URL = PersistentConfig(
  636. "AUDIO_OPENAI_API_BASE_URL",
  637. "audio.openai.api_base_url",
  638. os.getenv("AUDIO_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  639. )
  640. AUDIO_OPENAI_API_KEY = PersistentConfig(
  641. "AUDIO_OPENAI_API_KEY",
  642. "audio.openai.api_key",
  643. os.getenv("AUDIO_OPENAI_API_KEY", OPENAI_API_KEY),
  644. )
  645. AUDIO_OPENAI_API_MODEL = PersistentConfig(
  646. "AUDIO_OPENAI_API_MODEL",
  647. "audio.openai.api_model",
  648. os.getenv("AUDIO_OPENAI_API_MODEL", "tts-1"),
  649. )
  650. AUDIO_OPENAI_API_VOICE = PersistentConfig(
  651. "AUDIO_OPENAI_API_VOICE",
  652. "audio.openai.api_voice",
  653. os.getenv("AUDIO_OPENAI_API_VOICE", "alloy"),
  654. )
  655. ####################################
  656. # Database
  657. ####################################
  658. DATABASE_URL = os.environ.get("DATABASE_URL", f"sqlite:///{DATA_DIR}/webui.db")