# config.py
  1. import os
  2. import sys
  3. import logging
  4. import importlib.metadata
  5. import pkgutil
  6. import chromadb
  7. from chromadb import Settings
  8. from base64 import b64encode
  9. from bs4 import BeautifulSoup
  10. from typing import TypeVar, Generic, Union
  11. from pathlib import Path
  12. import json
  13. import yaml
  14. import markdown
  15. import requests
  16. import shutil
  17. from secrets import token_bytes
  18. from constants import ERROR_MESSAGES
  19. ####################################
  20. # Load .env file
  21. ####################################
  22. BACKEND_DIR = Path(__file__).parent # the path containing this file
  23. BASE_DIR = BACKEND_DIR.parent # the path containing the backend/
  24. try:
  25. from dotenv import load_dotenv, find_dotenv
  26. load_dotenv(find_dotenv(str(BASE_DIR / ".env")))
  27. except ImportError:
  28. print("dotenv not installed, skipping...")
  29. ####################################
  30. # LOGGING
  31. ####################################
  32. log_levels = ["CRITICAL", "ERROR", "WARNING", "INFO", "DEBUG"]
  33. GLOBAL_LOG_LEVEL = os.environ.get("GLOBAL_LOG_LEVEL", "").upper()
  34. if GLOBAL_LOG_LEVEL in log_levels:
  35. logging.basicConfig(stream=sys.stdout, level=GLOBAL_LOG_LEVEL, force=True)
  36. else:
  37. GLOBAL_LOG_LEVEL = "INFO"
  38. log = logging.getLogger(__name__)
  39. log.info(f"GLOBAL_LOG_LEVEL: {GLOBAL_LOG_LEVEL}")
  40. log_sources = [
  41. "AUDIO",
  42. "COMFYUI",
  43. "CONFIG",
  44. "DB",
  45. "IMAGES",
  46. "MAIN",
  47. "MODELS",
  48. "OLLAMA",
  49. "OPENAI",
  50. "RAG",
  51. "WEBHOOK",
  52. ]
  53. SRC_LOG_LEVELS = {}
  54. for source in log_sources:
  55. log_env_var = source + "_LOG_LEVEL"
  56. SRC_LOG_LEVELS[source] = os.environ.get(log_env_var, "").upper()
  57. if SRC_LOG_LEVELS[source] not in log_levels:
  58. SRC_LOG_LEVELS[source] = GLOBAL_LOG_LEVEL
  59. log.info(f"{log_env_var}: {SRC_LOG_LEVELS[source]}")
  60. log.setLevel(SRC_LOG_LEVELS["CONFIG"])
  61. WEBUI_NAME = os.environ.get("WEBUI_NAME", "Open WebUI")
  62. if WEBUI_NAME != "Open WebUI":
  63. WEBUI_NAME += " (Open WebUI)"
  64. WEBUI_URL = os.environ.get("WEBUI_URL", "http://localhost:3000")
  65. WEBUI_FAVICON_URL = "https://openwebui.com/favicon.png"
  66. ####################################
  67. # ENV (dev,test,prod)
  68. ####################################
  69. ENV = os.environ.get("ENV", "dev")
  70. try:
  71. PACKAGE_DATA = json.loads((BASE_DIR / "package.json").read_text())
  72. except:
  73. try:
  74. PACKAGE_DATA = {"version": importlib.metadata.version("open-webui")}
  75. except importlib.metadata.PackageNotFoundError:
  76. PACKAGE_DATA = {"version": "0.0.0"}
  77. VERSION = PACKAGE_DATA["version"]
  78. # Function to parse each section
  79. def parse_section(section):
  80. items = []
  81. for li in section.find_all("li"):
  82. # Extract raw HTML string
  83. raw_html = str(li)
  84. # Extract text without HTML tags
  85. text = li.get_text(separator=" ", strip=True)
  86. # Split into title and content
  87. parts = text.split(": ", 1)
  88. title = parts[0].strip() if len(parts) > 1 else ""
  89. content = parts[1].strip() if len(parts) > 1 else text
  90. items.append({"title": title, "content": content, "raw": raw_html})
  91. return items
  92. try:
  93. changelog_content = (BASE_DIR / "CHANGELOG.md").read_text()
  94. except:
  95. changelog_content = (pkgutil.get_data("open_webui", "CHANGELOG.md") or b"").decode()
  96. # Convert markdown content to HTML
  97. html_content = markdown.markdown(changelog_content)
  98. # Parse the HTML content
  99. soup = BeautifulSoup(html_content, "html.parser")
  100. # Initialize JSON structure
  101. changelog_json = {}
  102. # Iterate over each version
  103. for version in soup.find_all("h2"):
  104. version_number = version.get_text().strip().split(" - ")[0][1:-1] # Remove brackets
  105. date = version.get_text().strip().split(" - ")[1]
  106. version_data = {"date": date}
  107. # Find the next sibling that is a h3 tag (section title)
  108. current = version.find_next_sibling()
  109. while current and current.name != "h2":
  110. if current.name == "h3":
  111. section_title = current.get_text().lower() # e.g., "added", "fixed"
  112. section_items = parse_section(current.find_next_sibling("ul"))
  113. version_data[section_title] = section_items
  114. # Move to the next element
  115. current = current.find_next_sibling()
  116. changelog_json[version_number] = version_data
  117. CHANGELOG = changelog_json
  118. ####################################
  119. # WEBUI_VERSION
  120. ####################################
  121. WEBUI_VERSION = os.environ.get("WEBUI_VERSION", "v1.0.0-alpha.100")
  122. ####################################
  123. # DATA/FRONTEND BUILD DIR
  124. ####################################
  125. DATA_DIR = Path(os.getenv("DATA_DIR", BACKEND_DIR / "data")).resolve()
  126. FRONTEND_BUILD_DIR = Path(os.getenv("FRONTEND_BUILD_DIR", BASE_DIR / "build")).resolve()
  127. try:
  128. CONFIG_DATA = json.loads((DATA_DIR / "config.json").read_text())
  129. except:
  130. CONFIG_DATA = {}
  131. ####################################
  132. # Config helpers
  133. ####################################
  134. def save_config():
  135. try:
  136. with open(f"{DATA_DIR}/config.json", "w") as f:
  137. json.dump(CONFIG_DATA, f, indent="\t")
  138. except Exception as e:
  139. log.exception(e)
  140. def get_config_value(config_path: str):
  141. path_parts = config_path.split(".")
  142. cur_config = CONFIG_DATA
  143. for key in path_parts:
  144. if key in cur_config:
  145. cur_config = cur_config[key]
  146. else:
  147. return None
  148. return cur_config
  149. T = TypeVar("T")
  150. class PersistentConfig(Generic[T]):
  151. def __init__(self, env_name: str, config_path: str, env_value: T):
  152. self.env_name = env_name
  153. self.config_path = config_path
  154. self.env_value = env_value
  155. self.config_value = get_config_value(config_path)
  156. if self.config_value is not None:
  157. log.info(f"'{env_name}' loaded from config.json")
  158. self.value = self.config_value
  159. else:
  160. self.value = env_value
  161. def __str__(self):
  162. return str(self.value)
  163. @property
  164. def __dict__(self):
  165. raise TypeError(
  166. "PersistentConfig object cannot be converted to dict, use config_get or .value instead."
  167. )
  168. def __getattribute__(self, item):
  169. if item == "__dict__":
  170. raise TypeError(
  171. "PersistentConfig object cannot be converted to dict, use config_get or .value instead."
  172. )
  173. return super().__getattribute__(item)
  174. def save(self):
  175. # Don't save if the value is the same as the env value and the config value
  176. if self.env_value == self.value:
  177. if self.config_value == self.value:
  178. return
  179. log.info(f"Saving '{self.env_name}' to config.json")
  180. path_parts = self.config_path.split(".")
  181. config = CONFIG_DATA
  182. for key in path_parts[:-1]:
  183. if key not in config:
  184. config[key] = {}
  185. config = config[key]
  186. config[path_parts[-1]] = self.value
  187. save_config()
  188. self.config_value = self.value
  189. class AppConfig:
  190. _state: dict[str, PersistentConfig]
  191. def __init__(self):
  192. super().__setattr__("_state", {})
  193. def __setattr__(self, key, value):
  194. if isinstance(value, PersistentConfig):
  195. self._state[key] = value
  196. else:
  197. self._state[key].value = value
  198. self._state[key].save()
  199. def __getattr__(self, key):
  200. return self._state[key].value
  201. ####################################
  202. # WEBUI_AUTH (Required for security)
  203. ####################################
  204. WEBUI_AUTH = os.environ.get("WEBUI_AUTH", "True").lower() == "true"
  205. WEBUI_AUTH_TRUSTED_EMAIL_HEADER = os.environ.get(
  206. "WEBUI_AUTH_TRUSTED_EMAIL_HEADER", None
  207. )
  208. JWT_EXPIRES_IN = PersistentConfig(
  209. "JWT_EXPIRES_IN", "auth.jwt_expiry", os.environ.get("JWT_EXPIRES_IN", "-1")
  210. )
  211. ####################################
  212. # Static DIR
  213. ####################################
  214. STATIC_DIR = Path(os.getenv("STATIC_DIR", BACKEND_DIR / "static")).resolve()
  215. frontend_favicon = FRONTEND_BUILD_DIR / "favicon.png"
  216. if frontend_favicon.exists():
  217. shutil.copyfile(frontend_favicon, STATIC_DIR / "favicon.png")
  218. else:
  219. logging.warning(f"Frontend favicon not found at {frontend_favicon}")
  220. ####################################
  221. # CUSTOM_NAME
  222. ####################################
  223. CUSTOM_NAME = os.environ.get("CUSTOM_NAME", "")
  224. if CUSTOM_NAME:
  225. try:
  226. r = requests.get(f"https://api.openwebui.com/api/v1/custom/{CUSTOM_NAME}")
  227. data = r.json()
  228. if r.ok:
  229. if "logo" in data:
  230. WEBUI_FAVICON_URL = url = (
  231. f"https://api.openwebui.com{data['logo']}"
  232. if data["logo"][0] == "/"
  233. else data["logo"]
  234. )
  235. r = requests.get(url, stream=True)
  236. if r.status_code == 200:
  237. with open(f"{STATIC_DIR}/favicon.png", "wb") as f:
  238. r.raw.decode_content = True
  239. shutil.copyfileobj(r.raw, f)
  240. WEBUI_NAME = data["name"]
  241. except Exception as e:
  242. log.exception(e)
  243. pass
  244. ####################################
  245. # File Upload DIR
  246. ####################################
  247. UPLOAD_DIR = f"{DATA_DIR}/uploads"
  248. Path(UPLOAD_DIR).mkdir(parents=True, exist_ok=True)
  249. ####################################
  250. # Cache DIR
  251. ####################################
  252. CACHE_DIR = f"{DATA_DIR}/cache"
  253. Path(CACHE_DIR).mkdir(parents=True, exist_ok=True)
  254. ####################################
  255. # Docs DIR
  256. ####################################
  257. DOCS_DIR = os.getenv("DOCS_DIR", f"{DATA_DIR}/docs")
  258. Path(DOCS_DIR).mkdir(parents=True, exist_ok=True)
  259. ####################################
  260. # LITELLM_CONFIG
  261. ####################################
  262. def create_config_file(file_path):
  263. directory = os.path.dirname(file_path)
  264. # Check if directory exists, if not, create it
  265. if not os.path.exists(directory):
  266. os.makedirs(directory)
  267. # Data to write into the YAML file
  268. config_data = {
  269. "general_settings": {},
  270. "litellm_settings": {},
  271. "model_list": [],
  272. "router_settings": {},
  273. }
  274. # Write data to YAML file
  275. with open(file_path, "w") as file:
  276. yaml.dump(config_data, file)
  277. LITELLM_CONFIG_PATH = f"{DATA_DIR}/litellm/config.yaml"
  278. # if not os.path.exists(LITELLM_CONFIG_PATH):
  279. # log.info("Config file doesn't exist. Creating...")
  280. # create_config_file(LITELLM_CONFIG_PATH)
  281. # log.info("Config file created successfully.")
  282. ####################################
  283. # OLLAMA_BASE_URL
  284. ####################################
  285. ENABLE_OLLAMA_API = PersistentConfig(
  286. "ENABLE_OLLAMA_API",
  287. "ollama.enable",
  288. os.environ.get("ENABLE_OLLAMA_API", "True").lower() == "true",
  289. )
  290. OLLAMA_API_BASE_URL = os.environ.get(
  291. "OLLAMA_API_BASE_URL", "http://localhost:11434/api"
  292. )
  293. OLLAMA_BASE_URL = os.environ.get("OLLAMA_BASE_URL", "")
  294. K8S_FLAG = os.environ.get("K8S_FLAG", "")
  295. USE_OLLAMA_DOCKER = os.environ.get("USE_OLLAMA_DOCKER", "false")
  296. if OLLAMA_BASE_URL == "" and OLLAMA_API_BASE_URL != "":
  297. OLLAMA_BASE_URL = (
  298. OLLAMA_API_BASE_URL[:-4]
  299. if OLLAMA_API_BASE_URL.endswith("/api")
  300. else OLLAMA_API_BASE_URL
  301. )
  302. if ENV == "prod":
  303. if OLLAMA_BASE_URL == "/ollama" and not K8S_FLAG:
  304. if USE_OLLAMA_DOCKER.lower() == "true":
  305. # if you use all-in-one docker container (Open WebUI + Ollama)
  306. # with the docker build arg USE_OLLAMA=true (--build-arg="USE_OLLAMA=true") this only works with http://localhost:11434
  307. OLLAMA_BASE_URL = "http://localhost:11434"
  308. else:
  309. OLLAMA_BASE_URL = "http://host.docker.internal:11434"
  310. elif K8S_FLAG:
  311. OLLAMA_BASE_URL = "http://ollama-service.open-webui.svc.cluster.local:11434"
  312. OLLAMA_BASE_URLS = os.environ.get("OLLAMA_BASE_URLS", "")
  313. OLLAMA_BASE_URLS = OLLAMA_BASE_URLS if OLLAMA_BASE_URLS != "" else OLLAMA_BASE_URL
  314. OLLAMA_BASE_URLS = [url.strip() for url in OLLAMA_BASE_URLS.split(";")]
  315. OLLAMA_BASE_URLS = PersistentConfig(
  316. "OLLAMA_BASE_URLS", "ollama.base_urls", OLLAMA_BASE_URLS
  317. )
  318. ####################################
  319. # OPENAI_API
  320. ####################################
  321. ENABLE_OPENAI_API = PersistentConfig(
  322. "ENABLE_OPENAI_API",
  323. "openai.enable",
  324. os.environ.get("ENABLE_OPENAI_API", "True").lower() == "true",
  325. )
  326. OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY", "")
  327. OPENAI_API_BASE_URL = os.environ.get("OPENAI_API_BASE_URL", "")
  328. if OPENAI_API_BASE_URL == "":
  329. OPENAI_API_BASE_URL = "https://api.openai.com/v1"
  330. OPENAI_API_KEYS = os.environ.get("OPENAI_API_KEYS", "")
  331. OPENAI_API_KEYS = OPENAI_API_KEYS if OPENAI_API_KEYS != "" else OPENAI_API_KEY
  332. OPENAI_API_KEYS = [url.strip() for url in OPENAI_API_KEYS.split(";")]
  333. OPENAI_API_KEYS = PersistentConfig(
  334. "OPENAI_API_KEYS", "openai.api_keys", OPENAI_API_KEYS
  335. )
  336. OPENAI_API_BASE_URLS = os.environ.get("OPENAI_API_BASE_URLS", "")
  337. OPENAI_API_BASE_URLS = (
  338. OPENAI_API_BASE_URLS if OPENAI_API_BASE_URLS != "" else OPENAI_API_BASE_URL
  339. )
  340. OPENAI_API_BASE_URLS = [
  341. url.strip() if url != "" else "https://api.openai.com/v1"
  342. for url in OPENAI_API_BASE_URLS.split(";")
  343. ]
  344. OPENAI_API_BASE_URLS = PersistentConfig(
  345. "OPENAI_API_BASE_URLS", "openai.api_base_urls", OPENAI_API_BASE_URLS
  346. )
  347. OPENAI_API_KEY = ""
  348. try:
  349. OPENAI_API_KEY = OPENAI_API_KEYS.value[
  350. OPENAI_API_BASE_URLS.value.index("https://api.openai.com/v1")
  351. ]
  352. except:
  353. pass
  354. OPENAI_API_BASE_URL = "https://api.openai.com/v1"
  355. ####################################
  356. # WEBUI
  357. ####################################
  358. ENABLE_SIGNUP = PersistentConfig(
  359. "ENABLE_SIGNUP",
  360. "ui.enable_signup",
  361. (
  362. False
  363. if not WEBUI_AUTH
  364. else os.environ.get("ENABLE_SIGNUP", "True").lower() == "true"
  365. ),
  366. )
  367. DEFAULT_MODELS = PersistentConfig(
  368. "DEFAULT_MODELS", "ui.default_models", os.environ.get("DEFAULT_MODELS", None)
  369. )
  370. DEFAULT_PROMPT_SUGGESTIONS = PersistentConfig(
  371. "DEFAULT_PROMPT_SUGGESTIONS",
  372. "ui.prompt_suggestions",
  373. [
  374. {
  375. "title": ["Help me study", "vocabulary for a college entrance exam"],
  376. "content": "Help me study vocabulary: write a sentence for me to fill in the blank, and I'll try to pick the correct option.",
  377. },
  378. {
  379. "title": ["Give me ideas", "for what to do with my kids' art"],
  380. "content": "What are 5 creative things I could do with my kids' art? I don't want to throw them away, but it's also so much clutter.",
  381. },
  382. {
  383. "title": ["Tell me a fun fact", "about the Roman Empire"],
  384. "content": "Tell me a random fun fact about the Roman Empire",
  385. },
  386. {
  387. "title": ["Show me a code snippet", "of a website's sticky header"],
  388. "content": "Show me a code snippet of a website's sticky header in CSS and JavaScript.",
  389. },
  390. {
  391. "title": [
  392. "Explain options trading",
  393. "if I'm familiar with buying and selling stocks",
  394. ],
  395. "content": "Explain options trading in simple terms if I'm familiar with buying and selling stocks.",
  396. },
  397. {
  398. "title": ["Overcome procrastination", "give me tips"],
  399. "content": "Could you start by asking me about instances when I procrastinate the most and then give me some suggestions to overcome it?",
  400. },
  401. ],
  402. )
  403. DEFAULT_USER_ROLE = PersistentConfig(
  404. "DEFAULT_USER_ROLE",
  405. "ui.default_user_role",
  406. os.getenv("DEFAULT_USER_ROLE", "pending"),
  407. )
  408. USER_PERMISSIONS_CHAT_DELETION = (
  409. os.environ.get("USER_PERMISSIONS_CHAT_DELETION", "True").lower() == "true"
  410. )
  411. USER_PERMISSIONS = PersistentConfig(
  412. "USER_PERMISSIONS",
  413. "ui.user_permissions",
  414. {"chat": {"deletion": USER_PERMISSIONS_CHAT_DELETION}},
  415. )
  416. ENABLE_MODEL_FILTER = PersistentConfig(
  417. "ENABLE_MODEL_FILTER",
  418. "model_filter.enable",
  419. os.environ.get("ENABLE_MODEL_FILTER", "False").lower() == "true",
  420. )
  421. MODEL_FILTER_LIST = os.environ.get("MODEL_FILTER_LIST", "")
  422. MODEL_FILTER_LIST = PersistentConfig(
  423. "MODEL_FILTER_LIST",
  424. "model_filter.list",
  425. [model.strip() for model in MODEL_FILTER_LIST.split(";")],
  426. )
  427. WEBHOOK_URL = PersistentConfig(
  428. "WEBHOOK_URL", "webhook_url", os.environ.get("WEBHOOK_URL", "")
  429. )
  430. ENABLE_ADMIN_EXPORT = os.environ.get("ENABLE_ADMIN_EXPORT", "True").lower() == "true"
  431. ####################################
  432. # WEBUI_SECRET_KEY
  433. ####################################
  434. WEBUI_SECRET_KEY = os.environ.get(
  435. "WEBUI_SECRET_KEY",
  436. os.environ.get(
  437. "WEBUI_JWT_SECRET_KEY", "t0p-s3cr3t"
  438. ), # DEPRECATED: remove at next major version
  439. )
  440. if WEBUI_AUTH and WEBUI_SECRET_KEY == "":
  441. raise ValueError(ERROR_MESSAGES.ENV_VAR_NOT_FOUND)
  442. ####################################
  443. # RAG
  444. ####################################
  445. CHROMA_DATA_PATH = f"{DATA_DIR}/vector_db"
  446. CHROMA_TENANT = os.environ.get("CHROMA_TENANT", chromadb.DEFAULT_TENANT)
  447. CHROMA_DATABASE = os.environ.get("CHROMA_DATABASE", chromadb.DEFAULT_DATABASE)
  448. CHROMA_HTTP_HOST = os.environ.get("CHROMA_HTTP_HOST", "")
  449. CHROMA_HTTP_PORT = int(os.environ.get("CHROMA_HTTP_PORT", "8000"))
  450. # Comma-separated list of header=value pairs
  451. CHROMA_HTTP_HEADERS = os.environ.get("CHROMA_HTTP_HEADERS", "")
  452. if CHROMA_HTTP_HEADERS:
  453. CHROMA_HTTP_HEADERS = dict(
  454. [pair.split("=") for pair in CHROMA_HTTP_HEADERS.split(",")]
  455. )
  456. else:
  457. CHROMA_HTTP_HEADERS = None
  458. CHROMA_HTTP_SSL = os.environ.get("CHROMA_HTTP_SSL", "false").lower() == "true"
  459. # this uses the model defined in the Dockerfile ENV variable. If you dont use docker or docker based deployments such as k8s, the default embedding model will be used (sentence-transformers/all-MiniLM-L6-v2)
  460. RAG_TOP_K = PersistentConfig(
  461. "RAG_TOP_K", "rag.top_k", int(os.environ.get("RAG_TOP_K", "5"))
  462. )
  463. RAG_RELEVANCE_THRESHOLD = PersistentConfig(
  464. "RAG_RELEVANCE_THRESHOLD",
  465. "rag.relevance_threshold",
  466. float(os.environ.get("RAG_RELEVANCE_THRESHOLD", "0.0")),
  467. )
  468. ENABLE_RAG_HYBRID_SEARCH = PersistentConfig(
  469. "ENABLE_RAG_HYBRID_SEARCH",
  470. "rag.enable_hybrid_search",
  471. os.environ.get("ENABLE_RAG_HYBRID_SEARCH", "").lower() == "true",
  472. )
  473. ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION = PersistentConfig(
  474. "ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION",
  475. "rag.enable_web_loader_ssl_verification",
  476. os.environ.get("ENABLE_RAG_WEB_LOADER_SSL_VERIFICATION", "True").lower() == "true",
  477. )
  478. RAG_EMBEDDING_ENGINE = PersistentConfig(
  479. "RAG_EMBEDDING_ENGINE",
  480. "rag.embedding_engine",
  481. os.environ.get("RAG_EMBEDDING_ENGINE", ""),
  482. )
  483. PDF_EXTRACT_IMAGES = PersistentConfig(
  484. "PDF_EXTRACT_IMAGES",
  485. "rag.pdf_extract_images",
  486. os.environ.get("PDF_EXTRACT_IMAGES", "False").lower() == "true",
  487. )
  488. RAG_EMBEDDING_MODEL = PersistentConfig(
  489. "RAG_EMBEDDING_MODEL",
  490. "rag.embedding_model",
  491. os.environ.get("RAG_EMBEDDING_MODEL", "sentence-transformers/all-MiniLM-L6-v2"),
  492. )
  493. log.info(f"Embedding model set: {RAG_EMBEDDING_MODEL.value}"),
  494. RAG_EMBEDDING_MODEL_AUTO_UPDATE = (
  495. os.environ.get("RAG_EMBEDDING_MODEL_AUTO_UPDATE", "").lower() == "true"
  496. )
  497. RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE = (
  498. os.environ.get("RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE", "").lower() == "true"
  499. )
  500. RAG_RERANKING_MODEL = PersistentConfig(
  501. "RAG_RERANKING_MODEL",
  502. "rag.reranking_model",
  503. os.environ.get("RAG_RERANKING_MODEL", ""),
  504. )
  505. if RAG_RERANKING_MODEL.value != "":
  506. log.info(f"Reranking model set: {RAG_RERANKING_MODEL.value}"),
  507. RAG_RERANKING_MODEL_AUTO_UPDATE = (
  508. os.environ.get("RAG_RERANKING_MODEL_AUTO_UPDATE", "").lower() == "true"
  509. )
  510. RAG_RERANKING_MODEL_TRUST_REMOTE_CODE = (
  511. os.environ.get("RAG_RERANKING_MODEL_TRUST_REMOTE_CODE", "").lower() == "true"
  512. )
  513. if CHROMA_HTTP_HOST != "":
  514. CHROMA_CLIENT = chromadb.HttpClient(
  515. host=CHROMA_HTTP_HOST,
  516. port=CHROMA_HTTP_PORT,
  517. headers=CHROMA_HTTP_HEADERS,
  518. ssl=CHROMA_HTTP_SSL,
  519. tenant=CHROMA_TENANT,
  520. database=CHROMA_DATABASE,
  521. settings=Settings(allow_reset=True, anonymized_telemetry=False),
  522. )
  523. else:
  524. CHROMA_CLIENT = chromadb.PersistentClient(
  525. path=CHROMA_DATA_PATH,
  526. settings=Settings(allow_reset=True, anonymized_telemetry=False),
  527. tenant=CHROMA_TENANT,
  528. database=CHROMA_DATABASE,
  529. )
  530. # device type embedding models - "cpu" (default), "cuda" (nvidia gpu required) or "mps" (apple silicon) - choosing this right can lead to better performance
  531. USE_CUDA = os.environ.get("USE_CUDA_DOCKER", "false")
  532. if USE_CUDA.lower() == "true":
  533. DEVICE_TYPE = "cuda"
  534. else:
  535. DEVICE_TYPE = "cpu"
  536. CHUNK_SIZE = PersistentConfig(
  537. "CHUNK_SIZE", "rag.chunk_size", int(os.environ.get("CHUNK_SIZE", "1500"))
  538. )
  539. CHUNK_OVERLAP = PersistentConfig(
  540. "CHUNK_OVERLAP",
  541. "rag.chunk_overlap",
  542. int(os.environ.get("CHUNK_OVERLAP", "100")),
  543. )
  544. DEFAULT_RAG_TEMPLATE = """Use the following context as your learned knowledge, inside <context></context> XML tags.
  545. <context>
  546. [context]
  547. </context>
  548. When answer to user:
  549. - If you don't know, just say that you don't know.
  550. - If you don't know when you are not sure, ask for clarification.
  551. Avoid mentioning that you obtained the information from the context.
  552. And answer according to the language of the user's question.
  553. Given the context information, answer the query.
  554. Query: [query]"""
  555. RAG_TEMPLATE = PersistentConfig(
  556. "RAG_TEMPLATE",
  557. "rag.template",
  558. os.environ.get("RAG_TEMPLATE", DEFAULT_RAG_TEMPLATE),
  559. )
  560. RAG_OPENAI_API_BASE_URL = PersistentConfig(
  561. "RAG_OPENAI_API_BASE_URL",
  562. "rag.openai_api_base_url",
  563. os.getenv("RAG_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  564. )
  565. RAG_OPENAI_API_KEY = PersistentConfig(
  566. "RAG_OPENAI_API_KEY",
  567. "rag.openai_api_key",
  568. os.getenv("RAG_OPENAI_API_KEY", OPENAI_API_KEY),
  569. )
  570. ENABLE_RAG_LOCAL_WEB_FETCH = (
  571. os.getenv("ENABLE_RAG_LOCAL_WEB_FETCH", "False").lower() == "true"
  572. )
  573. YOUTUBE_LOADER_LANGUAGE = PersistentConfig(
  574. "YOUTUBE_LOADER_LANGUAGE",
  575. "rag.youtube_loader_language",
  576. os.getenv("YOUTUBE_LOADER_LANGUAGE", "en").split(","),
  577. )
  578. ####################################
  579. # Transcribe
  580. ####################################
  581. WHISPER_MODEL = os.getenv("WHISPER_MODEL", "base")
  582. WHISPER_MODEL_DIR = os.getenv("WHISPER_MODEL_DIR", f"{CACHE_DIR}/whisper/models")
  583. WHISPER_MODEL_AUTO_UPDATE = (
  584. os.environ.get("WHISPER_MODEL_AUTO_UPDATE", "").lower() == "true"
  585. )
  586. ####################################
  587. # Images
  588. ####################################
  589. IMAGE_GENERATION_ENGINE = PersistentConfig(
  590. "IMAGE_GENERATION_ENGINE",
  591. "image_generation.engine",
  592. os.getenv("IMAGE_GENERATION_ENGINE", ""),
  593. )
  594. ENABLE_IMAGE_GENERATION = PersistentConfig(
  595. "ENABLE_IMAGE_GENERATION",
  596. "image_generation.enable",
  597. os.environ.get("ENABLE_IMAGE_GENERATION", "").lower() == "true",
  598. )
  599. AUTOMATIC1111_BASE_URL = PersistentConfig(
  600. "AUTOMATIC1111_BASE_URL",
  601. "image_generation.automatic1111.base_url",
  602. os.getenv("AUTOMATIC1111_BASE_URL", ""),
  603. )
  604. COMFYUI_BASE_URL = PersistentConfig(
  605. "COMFYUI_BASE_URL",
  606. "image_generation.comfyui.base_url",
  607. os.getenv("COMFYUI_BASE_URL", ""),
  608. )
  609. IMAGES_OPENAI_API_BASE_URL = PersistentConfig(
  610. "IMAGES_OPENAI_API_BASE_URL",
  611. "image_generation.openai.api_base_url",
  612. os.getenv("IMAGES_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  613. )
  614. IMAGES_OPENAI_API_KEY = PersistentConfig(
  615. "IMAGES_OPENAI_API_KEY",
  616. "image_generation.openai.api_key",
  617. os.getenv("IMAGES_OPENAI_API_KEY", OPENAI_API_KEY),
  618. )
  619. IMAGE_SIZE = PersistentConfig(
  620. "IMAGE_SIZE", "image_generation.size", os.getenv("IMAGE_SIZE", "512x512")
  621. )
  622. IMAGE_STEPS = PersistentConfig(
  623. "IMAGE_STEPS", "image_generation.steps", int(os.getenv("IMAGE_STEPS", 50))
  624. )
  625. IMAGE_GENERATION_MODEL = PersistentConfig(
  626. "IMAGE_GENERATION_MODEL",
  627. "image_generation.model",
  628. os.getenv("IMAGE_GENERATION_MODEL", ""),
  629. )
  630. ####################################
  631. # Audio
  632. ####################################
  633. AUDIO_OPENAI_API_BASE_URL = PersistentConfig(
  634. "AUDIO_OPENAI_API_BASE_URL",
  635. "audio.openai.api_base_url",
  636. os.getenv("AUDIO_OPENAI_API_BASE_URL", OPENAI_API_BASE_URL),
  637. )
  638. AUDIO_OPENAI_API_KEY = PersistentConfig(
  639. "AUDIO_OPENAI_API_KEY",
  640. "audio.openai.api_key",
  641. os.getenv("AUDIO_OPENAI_API_KEY", OPENAI_API_KEY),
  642. )
  643. AUDIO_OPENAI_API_MODEL = PersistentConfig(
  644. "AUDIO_OPENAI_API_MODEL",
  645. "audio.openai.api_model",
  646. os.getenv("AUDIO_OPENAI_API_MODEL", "tts-1"),
  647. )
  648. AUDIO_OPENAI_API_VOICE = PersistentConfig(
  649. "AUDIO_OPENAI_API_VOICE",
  650. "audio.openai.api_voice",
  651. os.getenv("AUDIO_OPENAI_API_VOICE", "alloy"),
  652. )
  653. ####################################
  654. # Database
  655. ####################################
  656. DATABASE_URL = os.environ.get("DATABASE_URL", f"sqlite:///{DATA_DIR}/webui.db")