payload.py 6.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218
  1. from open_webui.utils.task import prompt_template, prompt_variables_template
  2. from open_webui.utils.misc import (
  3. add_or_update_system_message,
  4. )
  5. from typing import Callable, Optional
  6. # inplace function: form_data is modified
  7. def apply_model_system_prompt_to_body(
  8. params: dict, form_data: dict, metadata: Optional[dict] = None, user=None
  9. ) -> dict:
  10. system = params.get("system", None)
  11. if not system:
  12. return form_data
  13. # Metadata (WebUI Usage)
  14. if metadata:
  15. variables = metadata.get("variables", {})
  16. if variables:
  17. system = prompt_variables_template(system, variables)
  18. # Legacy (API Usage)
  19. if user:
  20. template_params = {
  21. "user_name": user.name,
  22. "user_location": user.info.get("location") if user.info else None,
  23. }
  24. else:
  25. template_params = {}
  26. system = prompt_template(system, **template_params)
  27. form_data["messages"] = add_or_update_system_message(
  28. system, form_data.get("messages", [])
  29. )
  30. return form_data
  31. # inplace function: form_data is modified
  32. def apply_model_params_to_body(
  33. params: dict, form_data: dict, mappings: dict[str, Callable]
  34. ) -> dict:
  35. if not params:
  36. return form_data
  37. for key, cast_func in mappings.items():
  38. if (value := params.get(key)) is not None:
  39. form_data[key] = cast_func(value)
  40. return form_data
  41. # inplace function: form_data is modified
  42. def apply_model_params_to_body_openai(params: dict, form_data: dict) -> dict:
  43. mappings = {
  44. "temperature": float,
  45. "top_p": float,
  46. "max_tokens": int,
  47. "frequency_penalty": float,
  48. "reasoning_effort": str,
  49. "seed": lambda x: x,
  50. "stop": lambda x: [bytes(s, "utf-8").decode("unicode_escape") for s in x],
  51. }
  52. return apply_model_params_to_body(params, form_data, mappings)
  53. def apply_model_params_to_body_ollama(params: dict, form_data: dict) -> dict:
  54. name_differences = {
  55. "max_tokens": "num_predict",
  56. }
  57. for key, value in name_differences.items():
  58. if (param := params.get(key, None)) is not None:
  59. form_data[value] = param
  60. opts = [
  61. "temperature",
  62. "top_p",
  63. "seed",
  64. "mirostat",
  65. "mirostat_eta",
  66. "mirostat_tau",
  67. "num_ctx",
  68. "num_batch",
  69. "num_keep",
  70. "num_predict",
  71. "repeat_last_n",
  72. "top_k",
  73. "min_p",
  74. "typical_p",
  75. "repeat_penalty",
  76. "presence_penalty",
  77. "frequency_penalty",
  78. "penalize_newline",
  79. "stop",
  80. "numa",
  81. "num_gpu",
  82. "main_gpu",
  83. "low_vram",
  84. "vocab_only",
  85. "use_mmap",
  86. "use_mlock",
  87. "num_thread",
  88. ]
  89. mappings = {i: lambda x: x for i in opts}
  90. form_data = apply_model_params_to_body(params, form_data, mappings)
  91. return form_data
  92. def convert_messages_openai_to_ollama(messages: list[dict]) -> list[dict]:
  93. ollama_messages = []
  94. for message in messages:
  95. # Initialize the new message structure with the role
  96. new_message = {"role": message["role"]}
  97. content = message.get("content", [])
  98. # Check if the content is a string (just a simple message)
  99. if isinstance(content, str):
  100. # If the content is a string, it's pure text
  101. new_message["content"] = content
  102. else:
  103. # Otherwise, assume the content is a list of dicts, e.g., text followed by an image URL
  104. content_text = ""
  105. images = []
  106. # Iterate through the list of content items
  107. for item in content:
  108. # Check if it's a text type
  109. if item.get("type") == "text":
  110. content_text += item.get("text", "")
  111. # Check if it's an image URL type
  112. elif item.get("type") == "image_url":
  113. img_url = item.get("image_url", {}).get("url", "")
  114. if img_url:
  115. # If the image url starts with data:, it's a base64 image and should be trimmed
  116. if img_url.startswith("data:"):
  117. img_url = img_url.split(",")[-1]
  118. images.append(img_url)
  119. # Add content text (if any)
  120. if content_text:
  121. new_message["content"] = content_text.strip()
  122. # Add images (if any)
  123. if images:
  124. new_message["images"] = images
  125. # Append the new formatted message to the result
  126. ollama_messages.append(new_message)
  127. return ollama_messages
  128. def convert_payload_openai_to_ollama(openai_payload: dict) -> dict:
  129. """
  130. Converts a payload formatted for OpenAI's API to be compatible with Ollama's API endpoint for chat completions.
  131. Args:
  132. openai_payload (dict): The payload originally designed for OpenAI API usage.
  133. Returns:
  134. dict: A modified payload compatible with the Ollama API.
  135. """
  136. ollama_payload = {}
  137. # Mapping basic model and message details
  138. ollama_payload["model"] = openai_payload.get("model")
  139. ollama_payload["messages"] = convert_messages_openai_to_ollama(
  140. openai_payload.get("messages")
  141. )
  142. ollama_payload["stream"] = openai_payload.get("stream", False)
  143. if "tools" in openai_payload:
  144. ollama_payload["tools"] = openai_payload["tools"]
  145. if "format" in openai_payload:
  146. ollama_payload["format"] = openai_payload["format"]
  147. # If there are advanced parameters in the payload, format them in Ollama's options field
  148. ollama_options = {}
  149. if openai_payload.get("options"):
  150. ollama_payload["options"] = openai_payload["options"]
  151. ollama_options = openai_payload["options"]
  152. # Handle parameters which map directly
  153. for param in ["temperature", "top_p", "seed"]:
  154. if param in openai_payload:
  155. ollama_options[param] = openai_payload[param]
  156. # Mapping OpenAI's `max_tokens` -> Ollama's `num_predict`
  157. if "max_completion_tokens" in openai_payload:
  158. ollama_options["num_predict"] = openai_payload["max_completion_tokens"]
  159. elif "max_tokens" in openai_payload:
  160. ollama_options["num_predict"] = openai_payload["max_tokens"]
  161. # Handle frequency / presence_penalty, which needs renaming and checking
  162. if "frequency_penalty" in openai_payload:
  163. ollama_options["repeat_penalty"] = openai_payload["frequency_penalty"]
  164. if "presence_penalty" in openai_payload and "penalty" not in ollama_options:
  165. # We are assuming presence penalty uses a similar concept in Ollama, which needs custom handling if exists.
  166. ollama_options["new_topic_penalty"] = openai_payload["presence_penalty"]
  167. # Add options to payload if any have been set
  168. if ollama_options:
  169. ollama_payload["options"] = ollama_options
  170. if "metadata" in openai_payload:
  171. ollama_payload["metadata"] = openai_payload["metadata"]
  172. return ollama_payload