payload.py 6.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220
  1. from open_webui.utils.task import prompt_template, prompt_variables_template
  2. from open_webui.utils.misc import (
  3. add_or_update_system_message,
  4. )
  5. from typing import Callable, Optional
  6. # inplace function: form_data is modified
  7. def apply_model_system_prompt_to_body(
  8. params: dict, form_data: dict, metadata: Optional[dict] = None, user=None
  9. ) -> dict:
  10. system = params.get("system", None)
  11. if not system:
  12. return form_data
  13. # Metadata (WebUI Usage)
  14. if metadata:
  15. variables = metadata.get("variables", {})
  16. if variables:
  17. system = prompt_variables_template(system, variables)
  18. # Legacy (API Usage)
  19. if user:
  20. template_params = {
  21. "user_name": user.name,
  22. "user_location": user.info.get("location") if user.info else None,
  23. }
  24. else:
  25. template_params = {}
  26. system = prompt_template(system, **template_params)
  27. form_data["messages"] = add_or_update_system_message(
  28. system, form_data.get("messages", [])
  29. )
  30. return form_data
  31. # inplace function: form_data is modified
  32. def apply_model_params_to_body(
  33. params: dict, form_data: dict, mappings: dict[str, Callable]
  34. ) -> dict:
  35. if not params:
  36. return form_data
  37. for key, cast_func in mappings.items():
  38. if (value := params.get(key)) is not None:
  39. form_data[key] = cast_func(value)
  40. return form_data
  41. # inplace function: form_data is modified
  42. def apply_model_params_to_body_openai(params: dict, form_data: dict) -> dict:
  43. mappings = {
  44. "temperature": float,
  45. "top_p": float,
  46. "max_tokens": int,
  47. "frequency_penalty": float,
  48. "reasoning_effort": str,
  49. "seed": lambda x: x,
  50. "stop": lambda x: [bytes(s, "utf-8").decode("unicode_escape") for s in x],
  51. }
  52. return apply_model_params_to_body(params, form_data, mappings)
  53. def apply_model_params_to_body_ollama(params: dict, form_data: dict) -> dict:
  54. opts = [
  55. "temperature",
  56. "top_p",
  57. "seed",
  58. "mirostat",
  59. "mirostat_eta",
  60. "mirostat_tau",
  61. "num_ctx",
  62. "num_batch",
  63. "num_keep",
  64. "num_predict",
  65. "repeat_last_n",
  66. "tfs_z",
  67. "top_k",
  68. "min_p",
  69. "typical_p",
  70. "repeat_penalty",
  71. "presence_penalty",
  72. "frequency_penalty",
  73. "penalize_newline",
  74. "stop",
  75. "numa",
  76. "num_gpu",
  77. "main_gpu",
  78. "low_vram",
  79. "vocab_only",
  80. "use_mmap",
  81. "use_mlock",
  82. "num_thread",
  83. ]
  84. mappings = {i: lambda x: x for i in opts}
  85. form_data = apply_model_params_to_body(params, form_data, mappings)
  86. name_differences = {
  87. "max_tokens": "num_predict",
  88. "frequency_penalty": "repeat_penalty",
  89. }
  90. for key, value in name_differences.items():
  91. if (param := params.get(key, None)) is not None:
  92. form_data[value] = param
  93. return form_data
  94. def convert_messages_openai_to_ollama(messages: list[dict]) -> list[dict]:
  95. ollama_messages = []
  96. for message in messages:
  97. # Initialize the new message structure with the role
  98. new_message = {"role": message["role"]}
  99. content = message.get("content", [])
  100. # Check if the content is a string (just a simple message)
  101. if isinstance(content, str):
  102. # If the content is a string, it's pure text
  103. new_message["content"] = content
  104. else:
  105. # Otherwise, assume the content is a list of dicts, e.g., text followed by an image URL
  106. content_text = ""
  107. images = []
  108. # Iterate through the list of content items
  109. for item in content:
  110. # Check if it's a text type
  111. if item.get("type") == "text":
  112. content_text += item.get("text", "")
  113. # Check if it's an image URL type
  114. elif item.get("type") == "image_url":
  115. img_url = item.get("image_url", {}).get("url", "")
  116. if img_url:
  117. # If the image url starts with data:, it's a base64 image and should be trimmed
  118. if img_url.startswith("data:"):
  119. img_url = img_url.split(",")[-1]
  120. images.append(img_url)
  121. # Add content text (if any)
  122. if content_text:
  123. new_message["content"] = content_text.strip()
  124. # Add images (if any)
  125. if images:
  126. new_message["images"] = images
  127. # Append the new formatted message to the result
  128. ollama_messages.append(new_message)
  129. return ollama_messages
  130. def convert_payload_openai_to_ollama(openai_payload: dict) -> dict:
  131. """
  132. Converts a payload formatted for OpenAI's API to be compatible with Ollama's API endpoint for chat completions.
  133. Args:
  134. openai_payload (dict): The payload originally designed for OpenAI API usage.
  135. Returns:
  136. dict: A modified payload compatible with the Ollama API.
  137. """
  138. ollama_payload = {}
  139. # Mapping basic model and message details
  140. ollama_payload["model"] = openai_payload.get("model")
  141. ollama_payload["messages"] = convert_messages_openai_to_ollama(
  142. openai_payload.get("messages")
  143. )
  144. ollama_payload["stream"] = openai_payload.get("stream", False)
  145. if "tools" in openai_payload:
  146. ollama_payload["tools"] = openai_payload["tools"]
  147. if "format" in openai_payload:
  148. ollama_payload["format"] = openai_payload["format"]
  149. # If there are advanced parameters in the payload, format them in Ollama's options field
  150. ollama_options = {}
  151. if openai_payload.get("options"):
  152. ollama_payload["options"] = openai_payload["options"]
  153. ollama_options = openai_payload["options"]
  154. # Handle parameters which map directly
  155. for param in ["temperature", "top_p", "seed"]:
  156. if param in openai_payload:
  157. ollama_options[param] = openai_payload[param]
  158. # Mapping OpenAI's `max_tokens` -> Ollama's `num_predict`
  159. if "max_completion_tokens" in openai_payload:
  160. ollama_options["num_predict"] = openai_payload["max_completion_tokens"]
  161. elif "max_tokens" in openai_payload:
  162. ollama_options["num_predict"] = openai_payload["max_tokens"]
  163. # Handle frequency / presence_penalty, which needs renaming and checking
  164. if "frequency_penalty" in openai_payload:
  165. ollama_options["repeat_penalty"] = openai_payload["frequency_penalty"]
  166. if "presence_penalty" in openai_payload and "penalty" not in ollama_options:
  167. # We are assuming presence penalty uses a similar concept in Ollama, which needs custom handling if exists.
  168. ollama_options["new_topic_penalty"] = openai_payload["presence_penalty"]
  169. # Add options to payload if any have been set
  170. if ollama_options:
  171. ollama_payload["options"] = ollama_options
  172. if "metadata" in openai_payload:
  173. ollama_payload["metadata"] = openai_payload["metadata"]
  174. return ollama_payload