comfyui.py 5.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174
  1. import asyncio
  2. import json
  3. import logging
  4. import random
  5. import urllib.parse
  6. import urllib.request
  7. from typing import Optional
  8. import websocket # NOTE: websocket-client (https://github.com/websocket-client/websocket-client)
  9. from open_webui.env import SRC_LOG_LEVELS
  10. from pydantic import BaseModel
  11. log = logging.getLogger(__name__)
  12. log.setLevel(SRC_LOG_LEVELS["COMFYUI"])
  13. default_headers = {"User-Agent": "Mozilla/5.0"}
  14. def queue_prompt(prompt, client_id, base_url):
  15. log.info("queue_prompt")
  16. p = {"prompt": prompt, "client_id": client_id}
  17. data = json.dumps(p).encode("utf-8")
  18. log.debug(f"queue_prompt data: {data}")
  19. try:
  20. req = urllib.request.Request(
  21. f"{base_url}/prompt", data=data, headers=default_headers
  22. )
  23. response = urllib.request.urlopen(req).read()
  24. return json.loads(response)
  25. except Exception as e:
  26. log.exception(f"Error while queuing prompt: {e}")
  27. raise e
  28. def get_image(filename, subfolder, folder_type, base_url):
  29. log.info("get_image")
  30. data = {"filename": filename, "subfolder": subfolder, "type": folder_type}
  31. url_values = urllib.parse.urlencode(data)
  32. req = urllib.request.Request(
  33. f"{base_url}/view?{url_values}", headers=default_headers
  34. )
  35. with urllib.request.urlopen(req) as response:
  36. return response.read()
  37. def get_image_url(filename, subfolder, folder_type, base_url):
  38. log.info("get_image")
  39. data = {"filename": filename, "subfolder": subfolder, "type": folder_type}
  40. url_values = urllib.parse.urlencode(data)
  41. return f"{base_url}/view?{url_values}"
  42. def get_history(prompt_id, base_url):
  43. log.info("get_history")
  44. req = urllib.request.Request(
  45. f"{base_url}/history/{prompt_id}", headers=default_headers
  46. )
  47. with urllib.request.urlopen(req) as response:
  48. return json.loads(response.read())
  49. def get_images(ws, prompt, client_id, base_url):
  50. prompt_id = queue_prompt(prompt, client_id, base_url)["prompt_id"]
  51. output_images = []
  52. while True:
  53. out = ws.recv()
  54. if isinstance(out, str):
  55. message = json.loads(out)
  56. if message["type"] == "executing":
  57. data = message["data"]
  58. if data["node"] is None and data["prompt_id"] == prompt_id:
  59. break # Execution is done
  60. else:
  61. continue # previews are binary data
  62. history = get_history(prompt_id, base_url)[prompt_id]
  63. for o in history["outputs"]:
  64. for node_id in history["outputs"]:
  65. node_output = history["outputs"][node_id]
  66. if "images" in node_output:
  67. for image in node_output["images"]:
  68. url = get_image_url(
  69. image["filename"], image["subfolder"], image["type"], base_url
  70. )
  71. output_images.append({"url": url})
  72. return {"data": output_images}
  73. class ComfyUINodeInput(BaseModel):
  74. type: Optional[str] = None
  75. node_ids: list[str] = []
  76. key: Optional[str] = "text"
  77. value: Optional[str] = None
  78. class ComfyUIWorkflow(BaseModel):
  79. workflow: str
  80. nodes: list[ComfyUINodeInput]
  81. class ComfyUIGenerateImageForm(BaseModel):
  82. workflow: ComfyUIWorkflow
  83. prompt: str
  84. negative_prompt: Optional[str] = None
  85. width: int
  86. height: int
  87. n: int = 1
  88. steps: Optional[int] = None
  89. seed: Optional[int] = None
  90. async def comfyui_generate_image(
  91. model: str, payload: ComfyUIGenerateImageForm, client_id, base_url
  92. ):
  93. ws_url = base_url.replace("http://", "ws://").replace("https://", "wss://")
  94. workflow = json.loads(payload.workflow.workflow)
  95. for node in payload.workflow.nodes:
  96. if node.type:
  97. if node.type == "model":
  98. for node_id in node.node_ids:
  99. workflow[node_id]["inputs"][node.key] = model
  100. elif node.type == "prompt":
  101. for node_id in node.node_ids:
  102. workflow[node_id]["inputs"]["text"] = payload.prompt
  103. elif node.type == "negative_prompt":
  104. for node_id in node.node_ids:
  105. workflow[node_id]["inputs"]["text"] = payload.negative_prompt
  106. elif node.type == "width":
  107. for node_id in node.node_ids:
  108. workflow[node_id]["inputs"]["width"] = payload.width
  109. elif node.type == "height":
  110. for node_id in node.node_ids:
  111. workflow[node_id]["inputs"]["height"] = payload.height
  112. elif node.type == "n":
  113. for node_id in node.node_ids:
  114. workflow[node_id]["inputs"]["batch_size"] = payload.n
  115. elif node.type == "steps":
  116. for node_id in node.node_ids:
  117. workflow[node_id]["inputs"]["steps"] = payload.steps
  118. elif node.type == "seed":
  119. seed = (
  120. payload.seed
  121. if payload.seed
  122. else random.randint(0, 18446744073709551614)
  123. )
  124. for node_id in node.node_ids:
  125. workflow[node_id]["inputs"][node.key] = seed
  126. else:
  127. for node_id in node.node_ids:
  128. workflow[node_id]["inputs"][node.key] = node.value
  129. try:
  130. ws = websocket.WebSocket()
  131. ws.connect(f"{ws_url}/ws?clientId={client_id}")
  132. log.info("WebSocket connection established.")
  133. except Exception as e:
  134. log.exception(f"Failed to connect to WebSocket server: {e}")
  135. return None
  136. try:
  137. log.info("Sending workflow to WebSocket server.")
  138. log.info(f"Workflow: {workflow}")
  139. images = await asyncio.to_thread(get_images, ws, workflow, client_id, base_url)
  140. except Exception as e:
  141. log.exception(f"Error while receiving images: {e}")
  142. images = None
  143. ws.close()
  144. return images