Add Create Video to the essentials tab (#13863)

2026-05-13 21:37:16 +08:00 · 2026-05-13 14:42:31 +08:00
3 changed files with 1 addition and 320 deletions
--- a/comfy_api_nodes/apis/anthropic.py
+++ b/comfy_api_nodes/apis/anthropic.py
@@ -1,70 +0,0 @@
-from enum import Enum
-from typing import Literal
-
-from pydantic import BaseModel, Field
-
-
-class AnthropicRole(str, Enum):
-    user = "user"
-    assistant = "assistant"
-
-
-class AnthropicTextContent(BaseModel):
-    type: Literal["text"] = "text"
-    text: str = Field(...)
-
-
-class AnthropicImageSourceBase64(BaseModel):
-    type: Literal["base64"] = "base64"
-    media_type: str = Field(..., description="MIME type of the image, e.g. image/png, image/jpeg")
-    data: str = Field(..., description="Base64-encoded image data")
-
-
-class AnthropicImageContent(BaseModel):
-    type: Literal["image"] = "image"
-    source: AnthropicImageSourceBase64 = Field(...)
-
-
-class AnthropicMessage(BaseModel):
-    role: AnthropicRole = Field(...)
-    content: list[AnthropicTextContent | AnthropicImageContent] = Field(...)
-
-
-class AnthropicMessagesRequest(BaseModel):
-    model: str = Field(...)
-    messages: list[AnthropicMessage] = Field(...)
-    max_tokens: int = Field(..., ge=1)
-    system: str | None = Field(None, description="Top-level system prompt")
-    temperature: float | None = Field(None, ge=0.0, le=1.0)
-    top_p: float | None = Field(None, ge=0.0, le=1.0)
-    top_k: int | None = Field(None, ge=0)
-    stop_sequences: list[str] | None = Field(None)
-
-
-class AnthropicResponseTextBlock(BaseModel):
-    type: Literal["text"] = "text"
-    text: str = Field(...)
-
-
-class AnthropicCacheCreationUsage(BaseModel):
-    ephemeral_5m_input_tokens: int | None = Field(None)
-    ephemeral_1h_input_tokens: int | None = Field(None)
-
-
-class AnthropicMessagesUsage(BaseModel):
-    input_tokens: int | None = Field(None)
-    output_tokens: int | None = Field(None)
-    cache_creation_input_tokens: int | None = Field(None)
-    cache_read_input_tokens: int | None = Field(None)
-    cache_creation: AnthropicCacheCreationUsage | None = Field(None)
-
-
-class AnthropicMessagesResponse(BaseModel):
-    id: str | None = Field(None)
-    type: str | None = Field(None)
-    role: str | None = Field(None)
-    model: str | None = Field(None)
-    content: list[AnthropicResponseTextBlock] | None = Field(None)
-    stop_reason: str | None = Field(None)
-    stop_sequence: str | None = Field(None)
-    usage: AnthropicMessagesUsage | None = Field(None)
--- a/comfy_api_nodes/nodes_anthropic.py
+++ b/comfy_api_nodes/nodes_anthropic.py
@@ -1,250 +0,0 @@
-"""API Nodes for Anthropic Claude (Messages API). See: https://docs.anthropic.com/en/api/messages"""
-
-from typing_extensions import override
-
-from comfy_api.latest import IO, ComfyExtension, Input
-from comfy_api_nodes.apis.anthropic import (
-    AnthropicImageContent,
-    AnthropicImageSourceBase64,
-    AnthropicMessage,
-    AnthropicMessagesRequest,
-    AnthropicMessagesResponse,
-    AnthropicRole,
-    AnthropicTextContent,
-)
-from comfy_api_nodes.util import (
-    ApiEndpoint,
-    downscale_image_tensor,
-    get_number_of_images,
-    sync_op,
-    tensor_to_base64_string,
-    validate_string,
-)
-
-ANTHROPIC_MESSAGES_ENDPOINT = "/proxy/anthropic/v1/messages"
-ANTHROPIC_IMAGE_MAX_PIXELS = 1568 * 1568  # Anthropic recommends max ~1568px on the longest edge
-CLAUDE_MAX_IMAGES = 20  # Anthropic supports up to 20 images per request
-
-CLAUDE_MODELS: dict[str, str] = {
-    "Opus 4.7": "claude-opus-4-7",
-    "Opus 4.6": "claude-opus-4-6",
-    "Sonnet 4.6": "claude-sonnet-4-6",
-    "Sonnet 4.5": "claude-sonnet-4-5-20250929",
-    "Haiku 4.5": "claude-haiku-4-5-20251001",
-}
-
-
-def _claude_model_inputs():
-    return [
-        IO.Int.Input(
-            "max_tokens",
-            default=16000,
-            min=32,
-            max=32000,
-            tooltip="Maximum number of tokens to generate before stopping.",
-            advanced=True,
-        ),
-        IO.Float.Input(
-            "temperature",
-            default=1.0,
-            min=0.0,
-            max=1.0,
-            step=0.01,
-            tooltip="Controls randomness. 0.0 is deterministic, 1.0 is most random.",
-            advanced=True,
-        ),
-    ]
-
-
-def _model_price_per_million(model: str) -> tuple[float, float] | None:
-    """Return (input_per_1M, output_per_1M) USD for a Claude model, or None if unknown."""
-    if "opus-4" in model:
-        return 15.0, 75.0
-    if "sonnet-4" in model:
-        return 3.0, 15.0
-    if "haiku-4-5" in model:
-        return 1.0, 5.0
-    return None
-
-
-def calculate_tokens_price(response: AnthropicMessagesResponse) -> float | None:
-    """Compute approximate USD price from response usage. Server-side billing is authoritative."""
-    if not response.usage or not response.model:
-        return None
-    rates = _model_price_per_million(response.model)
-    if rates is None:
-        return None
-    input_rate, output_rate = rates
-    input_tokens = response.usage.input_tokens or 0
-    output_tokens = response.usage.output_tokens or 0
-    cache_read = response.usage.cache_read_input_tokens or 0
-    cache_5m = 0
-    cache_1h = 0
-    if response.usage.cache_creation:
-        cache_5m = response.usage.cache_creation.ephemeral_5m_input_tokens or 0
-        cache_1h = response.usage.cache_creation.ephemeral_1h_input_tokens or 0
-    total = (
-        input_tokens * input_rate
-        + output_tokens * output_rate
-        + cache_read * input_rate * 0.1
-        + cache_5m * input_rate * 1.25
-        + cache_1h * input_rate * 2.0
-    )
-    return total / 1_000_000.0
-
-
-def _get_text_from_response(response: AnthropicMessagesResponse) -> str:
-    if not response.content:
-        return ""
-    return "\n".join(block.text for block in response.content if block.text)
-
-
-def _build_image_content_blocks(image_tensors: list[Input.Image]) -> list[AnthropicImageContent]:
-    """Convert image tensors (possibly batched) into Anthropic content blocks (base64 PNG)."""
-    blocks: list[AnthropicImageContent] = []
-    for tensor in image_tensors:
-        batch = tensor if len(tensor.shape) == 4 else tensor.unsqueeze(0)
-        for i in range(batch.shape[0]):
-            scaled = downscale_image_tensor(batch[i : i + 1], total_pixels=ANTHROPIC_IMAGE_MAX_PIXELS)
-            blocks.append(
-                AnthropicImageContent(
-                    source=AnthropicImageSourceBase64(
-                        media_type="image/png",
-                        data=tensor_to_base64_string(scaled),
-                    ),
-                )
-            )
-    return blocks
-
-
-class ClaudeNode(IO.ComfyNode):
-    """Generate text responses from an Anthropic Claude model."""
-
-    @classmethod
-    def define_schema(cls):
-        return IO.Schema(
-            node_id="ClaudeNode",
-            display_name="Anthropic Claude",
-            category="api node/text/Anthropic",
-            essentials_category="Text Generation",
-            description="Generate text responses with Anthropic's Claude models. "
-            "Provide a text prompt and optionally one or more images for multimodal context.",
-            inputs=[
-                IO.String.Input(
-                    "prompt",
-                    multiline=True,
-                    default="",
-                    tooltip="Text input to the model.",
-                ),
-                IO.DynamicCombo.Input(
-                    "model",
-                    options=[IO.DynamicCombo.Option(label, _claude_model_inputs()) for label in CLAUDE_MODELS],
-                    tooltip="The Claude model used to generate the response.",
-                ),
-                IO.Int.Input(
-                    "seed",
-                    default=0,
-                    min=0,
-                    max=2147483647,
-                    control_after_generate=True,
-                    tooltip="Seed controls whether the node should re-run; "
-                    "results are non-deterministic regardless of seed.",
-                ),
-                IO.Autogrow.Input(
-                    "images",
-                    template=IO.Autogrow.TemplateNames(
-                        IO.Image.Input("image"),
-                        names=[f"image_{i}" for i in range(1, CLAUDE_MAX_IMAGES + 1)],
-                        min=0,
-                    ),
-                    tooltip=f"Optional image(s) to use as context for the model. Up to {CLAUDE_MAX_IMAGES} images.",
-                ),
-                IO.String.Input(
-                    "system_prompt",
-                    multiline=True,
-                    default="",
-                    optional=True,
-                    advanced=True,
-                    tooltip="Foundational instructions that dictate the model's behavior.",
-                ),
-            ],
-            outputs=[IO.String.Output()],
-            hidden=[
-                IO.Hidden.auth_token_comfy_org,
-                IO.Hidden.api_key_comfy_org,
-                IO.Hidden.unique_id,
-            ],
-            is_api_node=True,
-            price_badge=IO.PriceBadge(
-                depends_on=IO.PriceBadgeDepends(widgets=["model"]),
-                expr="""
-                (
-                  $m := widgets.model;
-                  $contains($m, "opus") ? {
-                    "type": "list_usd",
-                    "usd": [0.015, 0.075],
-                    "format": { "approximate": true, "separator": "-", "suffix": " per 1K tokens" }
-                  }
-                  : $contains($m, "sonnet") ? {
-                    "type": "list_usd",
-                    "usd": [0.003, 0.015],
-                    "format": { "approximate": true, "separator": "-", "suffix": " per 1K tokens" }
-                  }
-                  : $contains($m, "haiku") ? {
-                    "type": "list_usd",
-                    "usd": [0.001, 0.005],
-                    "format": { "approximate": true, "separator": "-", "suffix": " per 1K tokens" }
-                  }
-                  : {"type":"text", "text":"Token-based"}
-                )
-                """,
-            ),
-        )
-
-    @classmethod
-    async def execute(
-        cls,
-        prompt: str,
-        model: dict,
-        seed: int,
-        images: dict | None = None,
-        system_prompt: str = "",
-    ) -> IO.NodeOutput:
-        validate_string(prompt, strip_whitespace=True, min_length=1)
-        model_label = model["model"]
-        max_tokens = model["max_tokens"]
-        temperature = model["temperature"]
-
-        image_tensors: list[Input.Image] = [t for t in (images or {}).values() if t is not None]
-        if sum(get_number_of_images(t) for t in image_tensors) > CLAUDE_MAX_IMAGES:
-            raise ValueError(f"Up to {CLAUDE_MAX_IMAGES} images are supported per request.")
-
-        content: list[AnthropicTextContent | AnthropicImageContent] = []
-        if image_tensors:
-            content.extend(_build_image_content_blocks(image_tensors))
-        content.append(AnthropicTextContent(text=prompt))
-
-        response = await sync_op(
-            cls,
-            ApiEndpoint(path=ANTHROPIC_MESSAGES_ENDPOINT, method="POST"),
-            response_model=AnthropicMessagesResponse,
-            data=AnthropicMessagesRequest(
-                model=CLAUDE_MODELS[model_label],
-                max_tokens=max_tokens,
-                messages=[AnthropicMessage(role=AnthropicRole.user, content=content)],
-                system=system_prompt or None,
-                temperature=temperature,
-            ),
-            price_extractor=calculate_tokens_price,
-        )
-        return IO.NodeOutput(_get_text_from_response(response) or "Empty response from Claude model.")
-
-
-class AnthropicExtension(ComfyExtension):
-    @override
-    async def get_node_list(self) -> list[type[IO.ComfyNode]]:
-        return [ClaudeNode]
-
-
-async def comfy_entrypoint() -> AnthropicExtension:
-    return AnthropicExtension()
--- a/comfy_extras/nodes_video.py
+++ b/comfy_extras/nodes_video.py
@@ -123,6 +123,7 @@ class CreateVideo(io.ComfyNode):
            search_aliases=["images to video"],
            display_name="Create Video",
            category="video",
+            essentials_category="Video Tools",
            description="Create a video from images.",
            inputs=[
                io.Image.Input("images", tooltip="The images to create a video from."),