Compare commits

..

9 Commits

Author SHA1 Message Date
dce0c22b69 Fix void failing with RuntimeError: start (0) + length (464) exceeds dimension size (461). 2026-05-13 14:21:31 +02:00
a5189fed51 Add Create Video to the essentials tab (#13863) 2026-05-13 14:42:31 +08:00
240363f11e chore: update embedded docs to v0.5.0 (#13865) 2026-05-13 13:33:29 +08:00
2bd65f2091 Better Hidream O1 mem usage factor for non dynamic vram. (#13864) 2026-05-12 20:55:38 -07:00
cccb697aa3 fix: create input directory if missing in LoadAudio define_schema (#13834) 2026-05-13 10:41:07 +08:00
300b6c8c91 Revert some breaking changes. (#13861) 2026-05-12 17:28:20 -07:00
1d95ed211e Fix LTXV mid-video multi-frame guide alignment (CORE-129) (#13625) 2026-05-13 06:57:31 +08:00
a5f7bc5658 Suppress false-positive Spectral lint on WebSocket endpoint (#13842)
The /ws path uses HTTP 101 (Switching Protocols), which is the correct
response for a WebSocket upgrade but not a 2xx. The built-in
operation-success-response rule fires as a false positive because
OpenAPI 3.x has no native WebSocket support.

Add a path-scoped override in .spectral.yaml to disable the rule for
/ws only, leaving it active for all other operations.
2026-05-12 13:14:50 -07:00
fb097bedc2 Mark deprecated cloud-runtime endpoints in spec (#13789)
* Mark deprecated cloud-runtime endpoints in openapi.yaml

Add five cloud-runtime FE-facing endpoints to the OSS spec with
deprecated: true and standardized description prefixes:

- GET /api/history_v2 — superseded by GET /api/jobs
- GET /api/history_v2/{prompt_id} — superseded by GET /api/jobs/{prompt_id}
- GET /api/logs — returns static placeholder; no real log data
- GET /api/viewvideo — alias of GET /api/view for legacy video playback
- GET /api/job/{job_id}/status — superseded by GET /api/jobs/{job_id}

Each endpoint is tagged x-runtime: [cloud] and follows the same
deprecation convention established for /api/history endpoints.

Co-authored-by: Matt Miller <MillerMedia@users.noreply.github.com>

* fix(spec): consolidate duplicate path entries on deprecated cloud-runtime endpoints

Previous commit added new path entries with `deprecated: true` for
`/api/job/{job_id}/status`, `/api/history_v2`, `/api/history_v2/{prompt_id}`,
`/api/logs`, and `/api/viewvideo`, but the canonical entries already existed
elsewhere in the file. Result: 5 duplicate path keys (Spectral parser errors),
and the deprecation flag did not land on the operations that FE clients
consume by operationId.

This commit moves `deprecated: true` plus the standardized "Deprecated."
description onto the canonical operations (`getCloudJobStatus`, `getHistoryV2`,
`getHistoryV2ByPromptId`, `getCloudLogs`, `viewVideo`) and removes the
duplicate entries. Operation IDs and response schemas are unchanged.

Spectral lint passes with zero new warnings.
2026-05-12 11:06:28 -07:00
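A quick way to see why the duplicate path keys were a problem: YAML mappings cannot legally repeat a key, so most loaders keep only one of the duplicate entries, and whichever copy carried deprecated: true can simply be dropped before any client sees it. A hedged sketch with a toy document (not the real openapi.yaml), using PyYAML:

import yaml

# Toy spec with a duplicate path key, mirroring the failure described above.
# PyYAML keeps the last duplicate, so the entry carrying "deprecated: true"
# is discarded here; Spectral instead reports the duplicate key as a parser error.
doc = """
paths:
  /api/logs:
    get:
      operationId: getCloudLogs
      deprecated: true
  /api/logs:
    get:
      operationId: getCloudLogs
"""
spec = yaml.safe_load(doc)
print(spec["paths"]["/api/logs"]["get"].get("deprecated"))  # None: the flag never landed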
8 changed files with 47 additions and 27 deletions

View File

@@ -89,3 +89,12 @@ rules:
     then:
       field: description
       function: truthy
+overrides:
+  # /ws uses HTTP 101 (Switching Protocols) — a legitimate response for a
+  # WebSocket upgrade, but not a 2xx, so operation-success-response fires
+  # as a false positive. OpenAPI 3.x has no native WebSocket support.
+  - files:
+      - "openapi.yaml#/paths/~1ws"
+    rules:
+      operation-success-response: off
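For context on why the override is needed: a WebSocket endpoint never returns a documented 2xx, because the upgrade handshake itself answers with HTTP 101. A minimal aiohttp sketch of such an endpoint (illustrative only, not ComfyUI's actual /ws handler or server wiring):

from aiohttp import WSMsgType, web

async def ws_handler(request):
    # prepare() completes the upgrade by sending HTTP 101 Switching Protocols,
    # so there is no 2xx response for operation-success-response to match.
    ws = web.WebSocketResponse()
    await ws.prepare(request)
    async for msg in ws:
        if msg.type == WSMsgType.TEXT:
            await ws.send_str(msg.data)  # simple echo, purely illustrative
    return ws

app = web.Application()
app.add_routes([web.get("/ws", ws_handler)])
# web.run_app(app)  # uncomment to serve the endpoint locally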

View File

@@ -1443,7 +1443,7 @@ class HiDreamO1(supported_models_base.BASE):
     }
     latent_format = latent_formats.HiDreamO1Pixel
-    memory_usage_factor = 0.6
+    memory_usage_factor = 0.033
     # fp16 not supported: LM MLP down_proj activations fp16 overflow, causing NaNs
     supported_inference_dtypes = [torch.bfloat16, torch.float32]
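The factor scales ComfyUI's rough VRAM reservation linearly, so dropping it from 0.6 to 0.033 shrinks the non-dynamic-VRAM budget by roughly 18x. A hedged sketch of how such a factor typically enters an area-based estimate (the latent shape, dtype size, and constants below are assumptions for illustration, not the exact memory_required formula):

import math

def estimated_vram_bytes(latent_shape, dtype_bytes, memory_usage_factor):
    # Illustrative only: scale a per-element cost by the latent area.
    batch, _channels, *spatial = latent_shape
    area = batch * math.prod(spatial)
    return area * dtype_bytes * memory_usage_factor * 0.01 * (1024 * 1024)

shape = (1, 16, 128, 128)  # hypothetical HiDream O1 latent, bf16 (2 bytes/element)
for factor in (0.6, 0.033):
    print(f"factor {factor}: {estimated_vram_bytes(shape, 2, factor) / 2**30:.3f} GiB")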

View File

@@ -1164,12 +1164,18 @@ def tiled_scale_multidim(samples, function, tile=(64, 64), overlap=8, upscale_am
             o = out
             o_d = out_div
+            ps_view = ps
+            mask_view = mask
             for d in range(dims):
-                o = o.narrow(d + 2, upscaled[d], mask.shape[d + 2])
-                o_d = o_d.narrow(d + 2, upscaled[d], mask.shape[d + 2])
+                l = min(ps_view.shape[d + 2], o.shape[d + 2] - upscaled[d])
+                o = o.narrow(d + 2, upscaled[d], l)
+                o_d = o_d.narrow(d + 2, upscaled[d], l)
+                if l < ps_view.shape[d + 2]:
+                    ps_view = ps_view.narrow(d + 2, 0, l)
+                    mask_view = mask_view.narrow(d + 2, 0, l)
-            o.add_(ps * mask)
-            o_d.add_(mask)
+            o.add_(ps_view * mask_view)
+            o_d.add_(mask_view)
             if pbar is not None:
                 pbar.update(1)
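The RuntimeError in the first commit comes from torch.Tensor.narrow, which refuses to read past the end of a dimension; the fix clamps the window length to what is actually left in the output and shrinks the matching views of ps and mask. A standalone sketch of the failure and the clamp (toy sizes, not the real tile shapes):

import torch

out = torch.zeros(1, 3, 461)   # output dim shorter than the tile placement expects
ps = torch.ones(1, 3, 464)     # upscaled tile
mask = torch.ones_like(ps)
start = 0

try:
    out.narrow(2, start, ps.shape[2])  # start (0) + length (464) exceeds dimension size (461)
except RuntimeError as e:
    print(e)

# The fix: clamp the length, then shrink the ps/mask views to the same window.
l = min(ps.shape[2], out.shape[2] - start)
out.narrow(2, start, l).add_(ps.narrow(2, 0, l) * mask.narrow(2, 0, l))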

View File

@@ -297,6 +297,7 @@ class LoadAudio(IO.ComfyNode):
     @classmethod
     def define_schema(cls):
         input_dir = folder_paths.get_input_directory()
+        os.makedirs(input_dir, exist_ok=True)
         files = folder_paths.filter_files_content_types(os.listdir(input_dir), ["audio", "video"])
         return IO.Schema(
             node_id="LoadAudio",

View File

@@ -338,8 +338,25 @@ class LTXVAddGuide(io.ComfyNode):
         noise_mask = get_noise_mask(latent)
         _, _, latent_length, latent_height, latent_width = latent_image.shape
+        # For mid-video multi-frame guides, prepend+strip a throwaway first frame so the VAE's "first latent = 1 pixel frame" asymmetry lands on the discarded slot
+        time_scale_factor = scale_factors[0]
+        num_frames_to_keep = ((image.shape[0] - 1) // time_scale_factor) * time_scale_factor + 1
+        resolved_frame_idx = frame_idx
+        if frame_idx < 0:
+            _, num_keyframes = get_keyframe_idxs(positive)
+            resolved_frame_idx = max((latent_length - num_keyframes - 1) * time_scale_factor + 1 + frame_idx, 0)
+        causal_fix = resolved_frame_idx == 0 or num_frames_to_keep == 1
+        if not causal_fix:
+            image = torch.cat([image[:1], image], dim=0)
         image, t = cls.encode(vae, latent_width, latent_height, image, scale_factors)
+        if not causal_fix:
+            t = t[:, :, 1:, :, :]
+            image = image[1:]
         frame_idx, latent_idx = cls.get_latent_index(positive, latent_length, len(image), frame_idx, scale_factors)
         assert latent_idx + t.shape[2] <= latent_length, "Conditioning frames exceed the length of the latent sequence."
@@ -352,6 +369,7 @@ class LTXVAddGuide(io.ComfyNode):
             t,
             strength,
             scale_factors,
+            causal_fix=causal_fix,
         )
         # Track this guide for per-reference attention control.
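The arithmetic behind causal_fix: the LTXV VAE is temporally asymmetric, with the first latent covering a single pixel frame and every later latent covering time_scale_factor frames. That is harmless for a guide starting at frame 0 or a single-frame guide, but a multi-frame guide placed mid-video would land misaligned, hence the throwaway first frame. A small worked example, assuming time_scale_factor = 8 and non-negative frame indices:

time_scale_factor = 8  # assumed temporal compression of the LTXV VAE

for num_image_frames, frame_idx in [(1, 40), (9, 0), (9, 40)]:
    num_frames_to_keep = ((num_image_frames - 1) // time_scale_factor) * time_scale_factor + 1
    causal_fix = frame_idx == 0 or num_frames_to_keep == 1
    print(f"{num_image_frames} guide frames at frame {frame_idx}: "
          f"keep {num_frames_to_keep}, prepend throwaway frame: {not causal_fix}")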

View File

@@ -40,23 +40,13 @@ def composite(destination, source, x, y, mask = None, multiplier = 8, resize_sou
     inverse_mask = torch.ones_like(mask) - mask
-    source_rgb = source[:, :3, :visible_height, :visible_width]
-    dest_slice = destination[..., top:bottom, left:right]
-    if destination.shape[1] == 4:
-        if torch.max(dest_slice) == 0:
-            destination[:, :3, top:bottom, left:right] = source_rgb
-            destination[:, 3:4, top:bottom, left:right] = mask
-        else:
-            destination[:, :3, top:bottom, left:right] = (mask * source_rgb) + (inverse_mask * dest_slice[:, :3])
-            destination[:, 3:4, top:bottom, left:right] = torch.max(mask, dest_slice[:, 3:4])
-    else:
-        source_portion = mask * source_rgb
-        destination_portion = inverse_mask * dest_slice
-        destination[..., top:bottom, left:right] = source_portion + destination_portion
+    source_portion = mask * source[..., :visible_height, :visible_width]
+    destination_portion = inverse_mask * destination[..., top:bottom, left:right]
+    destination[..., top:bottom, left:right] = source_portion + destination_portion
     return destination
 class LatentCompositeMasked(IO.ComfyNode):
     @classmethod
     def define_schema(cls):
@@ -95,23 +85,18 @@ class ImageCompositeMasked(IO.ComfyNode):
             display_name="Image Composite Masked",
             category="image",
             inputs=[
+                IO.Image.Input("destination"),
                 IO.Image.Input("source"),
                 IO.Int.Input("x", default=0, min=0, max=nodes.MAX_RESOLUTION, step=1),
                 IO.Int.Input("y", default=0, min=0, max=nodes.MAX_RESOLUTION, step=1),
                 IO.Boolean.Input("resize_source", default=False),
-                IO.Image.Input("destination", optional=True),
                 IO.Mask.Input("mask", optional=True),
             ],
             outputs=[IO.Image.Output()],
         )
     @classmethod
-    def execute(cls, source, x, y, resize_source, destination = None, mask = None) -> IO.NodeOutput:
-        if destination is None: # transparent rgba
-            B, H, W, C = source.shape
-            destination = torch.zeros((B, H, W, 4), dtype=source.dtype, device=source.device)
-            if C == 3:
-                source = torch.nn.functional.pad(source, (0, 1), value=1.0)
+    def execute(cls, destination, source, x, y, resize_source, mask = None) -> IO.NodeOutput:
+        destination, source = node_helpers.image_alpha_fix(destination, source)
         destination = destination.clone().movedim(-1, 1)
         output = composite(destination, source.movedim(-1, 1), x, y, mask, 1, resize_source).movedim(1, -1)
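The restored composite body is the plain masked blend: where the mask is 1 the source wins, where it is 0 the destination is untouched, and intermediate values mix the two linearly. A tiny standalone check of that behavior (toy tensors, channels-first as after the node's movedim(-1, 1)):

import torch

destination = torch.zeros(1, 3, 4, 4)               # toy canvas
source = torch.ones(1, 3, 2, 2)                     # toy patch pasted at (0, 0)
mask = torch.tensor([[[[1.0, 0.5], [0.0, 1.0]]]])   # per-pixel blend weights

inverse_mask = torch.ones_like(mask) - mask
top, bottom, left, right = 0, 2, 0, 2
source_portion = mask * source
destination_portion = inverse_mask * destination[..., top:bottom, left:right]
destination[..., top:bottom, left:right] = source_portion + destination_portion
print(destination[0, 0, :2, :2])  # tensor([[1.0, 0.5], [0.0, 1.0]])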

View File

@@ -123,6 +123,7 @@ class CreateVideo(io.ComfyNode):
             search_aliases=["images to video"],
             display_name="Create Video",
             category="video",
+            essentials_category="Video Tools",
             description="Create a video from images.",
             inputs=[
                 io.Image.Input("images", tooltip="The images to create a video from."),

View File

@@ -1,6 +1,6 @@
 comfyui-frontend-package==1.43.18
 comfyui-workflow-templates==0.9.73
-comfyui-embedded-docs==0.4.4
+comfyui-embedded-docs==0.5.0
 torch
 torchsde
 torchvision