8 changes: 4 additions & 4 deletions comfy_api/latest/_io.py
@@ -5,7 +5,7 @@
from abc import ABC, abstractmethod
from collections import Counter
from collections.abc import Iterable
from dataclasses import asdict, dataclass
from dataclasses import asdict, dataclass, field
from enum import Enum
from typing import Any, Callable, Literal, TypedDict, TypeVar, TYPE_CHECKING
from typing_extensions import NotRequired, final
@@ -1199,9 +1199,9 @@ class Schema:
"""Display name of node."""
category: str = "sd"
"""The category of the node, as per the "Add Node" menu."""
inputs: list[Input]=None
outputs: list[Output]=None
hidden: list[Hidden]=None
inputs: list[Input] = field(default_factory=list)
outputs: list[Output] = field(default_factory=list)
hidden: list[Hidden] = field(default_factory=list)
description: str=""
"""Node description, shown as a tooltip when hovering over the node."""
is_input_list: bool = False
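Side note on the _io.py change above: replacing the None defaults with field(default_factory=list) is the standard dataclass idiom for mutable defaults, so every Schema instance gets its own empty list and callers no longer need None checks. A minimal sketch of the behaviour, using a hypothetical stand-in class rather than the real Schema:

    from dataclasses import dataclass, field

    @dataclass
    class Example:
        items: list = field(default_factory=list)  # a bare [] default is rejected by dataclasses; None would leak into callers

    a, b = Example(), Example()
    a.items.append("x")
    assert b.items == []  # fresh list per instance, no shared state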
13 changes: 12 additions & 1 deletion comfy_api/latest/_ui.py
@@ -3,6 +3,7 @@
import json
import os
import random
import uuid
from io import BytesIO
from typing import Type

@@ -436,9 +437,19 @@ class PreviewUI3D(_UIOutput):
def __init__(self, model_file, camera_info, **kwargs):
self.model_file = model_file
self.camera_info = camera_info
self.bg_image_path = None
bg_image = kwargs.get("bg_image", None)
if bg_image is not None:
img_array = (bg_image[0].cpu().numpy() * 255).astype(np.uint8)
img = PILImage.fromarray(img_array)
temp_dir = folder_paths.get_temp_directory()
filename = f"bg_{uuid.uuid4().hex}.png"
bg_image_path = os.path.join(temp_dir, filename)
img.save(bg_image_path, compress_level=1)
self.bg_image_path = f"temp/{filename}"

def as_dict(self):
return {"result": [self.model_file, self.camera_info]}
return {"result": [self.model_file, self.camera_info, self.bg_image_path]}


class PreviewText(_UIOutput):
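On the _ui.py change above: the new bg_image branch assumes ComfyUI's usual IMAGE layout, a float tensor of shape [B, H, W, C] with values in [0, 1], converts frame 0 to 8-bit RGB, and saves it under the temp directory with a uuid-based filename so repeated runs do not collide; as_dict() then exposes the relative temp/ path. A rough standalone sketch of just that conversion (the tensor and output path here are placeholders):

    import numpy as np
    import torch
    from PIL import Image as PILImage

    bg_image = torch.rand(1, 512, 512, 3)                         # stand-in for the IMAGE input
    img_array = (bg_image[0].cpu().numpy() * 255).astype(np.uint8)
    PILImage.fromarray(img_array).save("bg_example.png", compress_level=1)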
30 changes: 25 additions & 5 deletions comfy_api_nodes/apis/kling_api.py
@@ -46,21 +46,41 @@ class TaskStatusVideoResult(BaseModel):
url: str | None = Field(None, description="URL for generated video")


class TaskStatusVideoResults(BaseModel):
class TaskStatusImageResult(BaseModel):
index: int = Field(..., description="Image Number,0-9")
url: str = Field(..., description="URL for generated image")


class OmniTaskStatusResults(BaseModel):
videos: list[TaskStatusVideoResult] | None = Field(None)
images: list[TaskStatusImageResult] | None = Field(None)


class TaskStatusVideoResponseData(BaseModel):
class OmniTaskStatusResponseData(BaseModel):
created_at: int | None = Field(None, description="Task creation time")
updated_at: int | None = Field(None, description="Task update time")
task_status: str | None = None
task_status_msg: str | None = Field(None, description="Additional failure reason. Only for polling endpoint.")
task_id: str | None = Field(None, description="Task ID")
task_result: TaskStatusVideoResults | None = Field(None)
task_result: OmniTaskStatusResults | None = Field(None)


class TaskStatusVideoResponse(BaseModel):
class OmniTaskStatusResponse(BaseModel):
code: int | None = Field(None, description="Error code")
message: str | None = Field(None, description="Error message")
request_id: str | None = Field(None, description="Request ID")
data: TaskStatusVideoResponseData | None = Field(None)
data: OmniTaskStatusResponseData | None = Field(None)


class OmniImageParamImage(BaseModel):
image: str = Field(...)


class OmniProImageRequest(BaseModel):
model_name: str = Field(..., description="kling-image-o1")
resolution: str = Field(..., description="'1k' or '2k'")
aspect_ratio: str | None = Field(...)
prompt: str = Field(...)
mode: str = Field("pro")
n: int | None = Field(1, le=9)
image_list: list[OmniImageParamImage] | None = Field(..., max_length=10)
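Based only on the field definitions above, a hedged example of how the new image request might be filled in (all values are illustrative; mode defaults to "pro" and n is capped at 9):

    request = OmniProImageRequest(
        model_name="kling-image-o1",
        resolution="1k",
        aspect_ratio="16:9",
        prompt="Place <<<image_1>>> on a marble table, soft studio lighting",
        n=1,
        image_list=[OmniImageParamImage(image="https://example.com/reference.png")],
    )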
138 changes: 130 additions & 8 deletions comfy_api_nodes/nodes_kling.py
@@ -6,6 +6,7 @@

import logging
import math
import re

import torch
from typing_extensions import override
@@ -49,12 +50,14 @@
KlingSingleImageEffectModelName,
)
from comfy_api_nodes.apis.kling_api import (
OmniImageParamImage,
OmniParamImage,
OmniParamVideo,
OmniProFirstLastFrameRequest,
OmniProImageRequest,
OmniProReferences2VideoRequest,
OmniProText2VideoRequest,
TaskStatusVideoResponse,
OmniTaskStatusResponse,
)
from comfy_api_nodes.util import (
ApiEndpoint,
@@ -210,16 +213,46 @@
}


async def finish_omni_video_task(cls: type[IO.ComfyNode], response: TaskStatusVideoResponse) -> IO.NodeOutput:
def normalize_omni_prompt_references(prompt: str) -> str:
"""
Rewrites Kling Omni-style placeholders used in the app, like:

@image, @image1, @image2, ... @imageN
@video, @video1, @video2, ... @videoN

into the API-compatible form:

<<<image_1>>>, <<<image_2>>>, ...
<<<video_1>>>, <<<video_2>>>, ...

This is a UX shim for ComfyUI so users can type the same syntax as in the Kling app.
"""
if not prompt:
return prompt

def _image_repl(match):
return f"<<<image_{match.group('idx') or '1'}>>>"

def _video_repl(match):
return f"<<<video_{match.group('idx') or '1'}>>>"

# (?<!\w) avoids matching e.g. "user@image.com"
# (?!\w) makes sure we only match @image / @image<digits> and not @imageFoo
prompt = re.sub(r"(?<!\w)@image(?P<idx>\d*)(?!\w)", _image_repl, prompt)
return re.sub(r"(?<!\w)@video(?P<idx>\d*)(?!\w)", _video_repl, prompt)
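# Illustrative check of the rewrite above (placeholder prompt, not from the codebase):
#   normalize_omni_prompt_references("Blend @image1 and @image2, keep the motion of @video")
#   -> "Blend <<<image_1>>> and <<<image_2>>>, keep the motion of <<<video_1>>>"
# while text such as "user@image.com" or "@imageFoo" is left untouched by the guards.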


async def finish_omni_video_task(cls: type[IO.ComfyNode], response: OmniTaskStatusResponse) -> IO.NodeOutput:
if response.code:
raise RuntimeError(
f"Kling request failed. Code: {response.code}, Message: {response.message}, Data: {response.data}"
)
final_response = await poll_op(
cls,
ApiEndpoint(path=f"/proxy/kling/v1/videos/omni-video/{response.data.task_id}"),
response_model=TaskStatusVideoResponse,
response_model=OmniTaskStatusResponse,
status_extractor=lambda r: (r.data.task_status if r.data else None),
max_poll_attempts=160,
)
return IO.NodeOutput(await download_url_to_video_output(final_response.data.task_result.videos[0].url))
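# Flow recap: callers first run sync_op to submit the generation request and get back a task_id;
# finish_omni_video_task then polls /proxy/kling/v1/videos/omni-video/<task_id> (up to
# max_poll_attempts=160) until the extracted task_status indicates the task is done, and finally
# downloads the first video URL from task_result as the node output.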

@@ -801,7 +834,7 @@ async def execute(
response = await sync_op(
cls,
ApiEndpoint(path="/proxy/kling/v1/videos/omni-video", method="POST"),
response_model=TaskStatusVideoResponse,
response_model=OmniTaskStatusResponse,
data=OmniProText2VideoRequest(
model_name=model_name,
prompt=prompt,
@@ -864,6 +897,7 @@ async def execute(
end_frame: Input.Image | None = None,
reference_images: Input.Image | None = None,
) -> IO.NodeOutput:
prompt = normalize_omni_prompt_references(prompt)
validate_string(prompt, min_length=1, max_length=2500)
if end_frame is not None and reference_images is not None:
raise ValueError("The 'end_frame' input cannot be used simultaneously with 'reference_images'.")
@@ -895,7 +929,7 @@ async def execute(
response = await sync_op(
cls,
ApiEndpoint(path="/proxy/kling/v1/videos/omni-video", method="POST"),
response_model=TaskStatusVideoResponse,
response_model=OmniTaskStatusResponse,
data=OmniProFirstLastFrameRequest(
model_name=model_name,
prompt=prompt,
@@ -950,6 +984,7 @@ async def execute(
duration: int,
reference_images: Input.Image,
) -> IO.NodeOutput:
prompt = normalize_omni_prompt_references(prompt)
validate_string(prompt, min_length=1, max_length=2500)
if get_number_of_images(reference_images) > 7:
raise ValueError("The maximum number of reference images is 7.")
@@ -962,7 +997,7 @@ async def execute(
response = await sync_op(
cls,
ApiEndpoint(path="/proxy/kling/v1/videos/omni-video", method="POST"),
response_model=TaskStatusVideoResponse,
response_model=OmniTaskStatusResponse,
data=OmniProReferences2VideoRequest(
model_name=model_name,
prompt=prompt,
@@ -1023,6 +1058,7 @@ async def execute(
keep_original_sound: bool,
reference_images: Input.Image | None = None,
) -> IO.NodeOutput:
prompt = normalize_omni_prompt_references(prompt)
validate_string(prompt, min_length=1, max_length=2500)
validate_video_duration(reference_video, min_duration=3.0, max_duration=10.05)
validate_video_dimensions(reference_video, min_width=720, min_height=720, max_width=2160, max_height=2160)
@@ -1045,7 +1081,7 @@ async def execute(
response = await sync_op(
cls,
ApiEndpoint(path="/proxy/kling/v1/videos/omni-video", method="POST"),
response_model=TaskStatusVideoResponse,
response_model=OmniTaskStatusResponse,
data=OmniProReferences2VideoRequest(
model_name=model_name,
prompt=prompt,
@@ -1103,6 +1139,7 @@ async def execute(
keep_original_sound: bool,
reference_images: Input.Image | None = None,
) -> IO.NodeOutput:
prompt = normalize_omni_prompt_references(prompt)
validate_string(prompt, min_length=1, max_length=2500)
validate_video_duration(video, min_duration=3.0, max_duration=10.05)
validate_video_dimensions(video, min_width=720, min_height=720, max_width=2160, max_height=2160)
@@ -1125,7 +1162,7 @@ async def execute(
response = await sync_op(
cls,
ApiEndpoint(path="/proxy/kling/v1/videos/omni-video", method="POST"),
response_model=TaskStatusVideoResponse,
response_model=OmniTaskStatusResponse,
data=OmniProReferences2VideoRequest(
model_name=model_name,
prompt=prompt,
@@ -1138,6 +1175,90 @@ async def execute(
return await finish_omni_video_task(cls, response)


class OmniProImageNode(IO.ComfyNode):

@classmethod
def define_schema(cls) -> IO.Schema:
return IO.Schema(
node_id="KlingOmniProImageNode",
display_name="Kling Omni Image (Pro)",
category="api node/image/Kling",
description="Create or edit images with the latest model from Kling.",
inputs=[
IO.Combo.Input("model_name", options=["kling-image-o1"]),
IO.String.Input(
"prompt",
multiline=True,
tooltip="A text prompt describing the image content. "
"This can include both positive and negative descriptions.",
),
IO.Combo.Input("resolution", options=["1K", "2K"]),
IO.Combo.Input(
"aspect_ratio",
options=["16:9", "9:16", "1:1", "4:3", "3:4", "3:2", "2:3", "21:9"],
),
IO.Image.Input(
"reference_images",
tooltip="Up to 10 additional reference images.",
optional=True,
),
],
outputs=[
IO.Image.Output(),
],
hidden=[
IO.Hidden.auth_token_comfy_org,
IO.Hidden.api_key_comfy_org,
IO.Hidden.unique_id,
],
is_api_node=True,
)

@classmethod
async def execute(
cls,
model_name: str,
prompt: str,
resolution: str,
aspect_ratio: str,
reference_images: Input.Image | None = None,
) -> IO.NodeOutput:
prompt = normalize_omni_prompt_references(prompt)
validate_string(prompt, min_length=1, max_length=2500)
image_list: list[OmniImageParamImage] = []
if reference_images is not None:
if get_number_of_images(reference_images) > 10:
raise ValueError("The maximum number of reference images is 10.")
for i in reference_images:
validate_image_dimensions(i, min_width=300, min_height=300)
validate_image_aspect_ratio(i, (1, 2.5), (2.5, 1))
for i in await upload_images_to_comfyapi(cls, reference_images, wait_label="Uploading reference image"):
image_list.append(OmniImageParamImage(image=i))
response = await sync_op(
cls,
ApiEndpoint(path="/proxy/kling/v1/images/omni-image", method="POST"),
response_model=OmniTaskStatusResponse,
data=OmniProImageRequest(
model_name=model_name,
prompt=prompt,
resolution=resolution.lower(),
aspect_ratio=aspect_ratio,
image_list=image_list if image_list else None,
),
)
if response.code:
raise RuntimeError(
f"Kling request failed. Code: {response.code}, Message: {response.message}, Data: {response.data}"
)
final_response = await poll_op(
cls,
ApiEndpoint(path=f"/proxy/kling/v1/images/omni-image/{response.data.task_id}"),
response_model=OmniTaskStatusResponse,
status_extractor=lambda r: (r.data.task_status if r.data else None),
)
return IO.NodeOutput(await download_url_to_image_tensor(final_response.data.task_result.images[0].url))


class KlingCameraControlT2VNode(IO.ComfyNode):
"""
Kling Text to Video Camera Control Node. This node is a text to video node, but it supports controlling the camera.
@@ -1935,6 +2056,7 @@ async def get_node_list(self) -> list[type[IO.ComfyNode]]:
OmniProImageToVideoNode,
OmniProVideoToVideoNode,
OmniProEditVideoNode,
# OmniProImageNode, # need support from backend
]

