feat: allow --comfy-api-base to target ephemeral testenvs

Signed-off-by: bigcat88 <bigcat88@icloud.com>
2026-06-23 14:47:21 +08:00 · 2026-06-20 21:24:34 +03:00
18 changed files with 179 additions and 569 deletions
--- a/comfy/comfy_api_env.py
+++ b/comfy/comfy_api_env.py
@ -0,0 +1,46 @@
+"""Runtime config the frontend reads from /features to follow --comfy-api-base.
+
+For a non-prod comfy.org backend (staging or an ephemeral preview env), "/features" exposes the api and
+platform base so the frontend talks to it without a rebuild; the frontend picks the Firebase project from the api base.
+Prod bases are left alone and keep their build-time defaults.
+"""
+
+from typing import Any
+from urllib.parse import urlparse
+
+from comfy.cli_args import args
+
+# Staging and the ephemeral preview envs ("testenvs") are one tier: same dev Firebase project and platform.
+_STAGING_API_HOST = "stagingapi.comfy.org"
+_TESTENV_HOST_SUFFIX = ".testenvs.comfy.org"
+_STAGING_PLATFORM_BASE_URL = "https://stagingplatform.comfy.org"
+
+
+def _is_staging_tier(host: str) -> bool:
+    return host.endswith(_TESTENV_HOST_SUFFIX) or host == _STAGING_API_HOST
+
+
+def normalize_comfy_api_base(url: str) -> str:
+    """Point a testenv's friendly main host at its comfy-api '-registry' sibling; other URLs pass through."""
+    parts = urlparse(url)
+    hostname = parts.hostname or ""
+    env_name = hostname.removesuffix(_TESTENV_HOST_SUFFIX)
+    # Unchanged when the host is not a testenv (nothing stripped) or already names the registry sibling.
+    if env_name == hostname or env_name.endswith("-registry"):
+        return url
+    # Rebuilt from scheme and host only; the scheme falls back to https.
+    return f"{parts.scheme or 'https'}://{env_name}-registry{_TESTENV_HOST_SUFFIX}"
+
+
+def frontend_config_for_base(base_url: str) -> dict[str, Any] | None:
+    """Build the /features overrides for a staging-tier base URL; any other base yields None."""
+    hostname = urlparse(base_url).hostname or ""
+    if not _is_staging_tier(hostname):
+        return None
+    # Testenv main hosts are mapped to their '-registry' sibling; trailing slashes are trimmed.
+    api_base = normalize_comfy_api_base(base_url).rstrip("/")
+    return {"comfy_api_base_url": api_base, "comfy_platform_base_url": _STAGING_PLATFORM_BASE_URL}
+
+
+def get_frontend_config() -> dict[str, Any] | None:
+    return frontend_config_for_base(getattr(args, "comfy_api_base", None) or "")
--- a/comfy/ldm/krea2/model.py
+++ b/comfy/ldm/krea2/model.py
@ -1,290 +0,0 @@
-"""Krea 2 (K2) — single-stream MMDiT.
-
-Text tokens produced by a Qwen3-VL-4B 12-layer ``txtfusion`` adapter and patchified image tokens are
-concatenated into one sequence and run through ``layers`` shared transformer blocks with
-AdaLN-single modulation, GQA + per-head QK-norm + sigmoid-gated attention, SwiGLU MLP, and 3-axis RoPE.
-"""
-
-from typing import Optional
-
-import torch
-import torch.nn as nn
-import torch.nn.functional as F
-from einops import rearrange
-
-import comfy.model_management
-import comfy.patcher_extension
-import comfy.ldm.common_dit
-from comfy.ldm.flux.layers import EmbedND, timestep_embedding
-from comfy.ldm.flux.math import apply_rope
-from comfy.ldm.modules.attention import optimized_attention_masked
-
-
-class RMSNorm(nn.Module):
-    """RMSNorm with the reference ``(1 + scale)`` weight convention (scale stored zero-centered)."""
-
-    def __init__(self, features: int, eps: float = 1e-5, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.eps = eps
-        self.scale = nn.Parameter(torch.empty(features, device=device, dtype=dtype))
-
-    def forward(self, x: torch.Tensor) -> torch.Tensor:
-        dtype = x.dtype
-        weight = comfy.model_management.cast_to(self.scale, dtype=torch.float32, device=x.device) + 1.0
-        return F.rms_norm(x.float(), (x.shape[-1],), weight=weight, eps=self.eps).to(dtype)
-
-
-class QKNorm(nn.Module):
-    def __init__(self, dim: int, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.qnorm = RMSNorm(dim, device=device, dtype=dtype, operations=operations)
-        self.knorm = RMSNorm(dim, device=device, dtype=dtype, operations=operations)
-
-    def forward(self, q, k):
-        return self.qnorm(q), self.knorm(k)
-
-
-class SwiGLU(nn.Module):
-    def __init__(self, features: int, multiplier: int, bias: bool = False, multiple: int = 128,
-                 device=None, dtype=None, operations=None):
-        super().__init__()
-        mlpdim = int(2 * features / 3) * multiplier
-        mlpdim = multiple * ((mlpdim + multiple - 1) // multiple)
-        self.gate = operations.Linear(features, mlpdim, bias=bias, device=device, dtype=dtype)
-        self.up = operations.Linear(features, mlpdim, bias=bias, device=device, dtype=dtype)
-        self.down = operations.Linear(mlpdim, features, bias=bias, device=device, dtype=dtype)
-
-    def forward(self, x):
-        return self.down(F.silu(self.gate(x)).mul_(self.up(x)))
-
-
-class Attention(nn.Module):
-    def __init__(self, dim: int, heads: int, kvheads: Optional[int] = None, bias: bool = False,
-                 device=None, dtype=None, operations=None):
-        super().__init__()
-        self.heads = heads
-        self.kvheads = kvheads if kvheads is not None else heads
-        self.headdim = dim // self.heads
-        self.wq = operations.Linear(dim, self.headdim * self.heads, bias=bias, device=device, dtype=dtype)
-        self.wk = operations.Linear(dim, self.headdim * self.kvheads, bias=bias, device=device, dtype=dtype)
-        self.wv = operations.Linear(dim, self.headdim * self.kvheads, bias=bias, device=device, dtype=dtype)
-        self.gate = operations.Linear(dim, dim, bias=bias, device=device, dtype=dtype)
-        self.qknorm = QKNorm(self.headdim, device=device, dtype=dtype, operations=operations)
-        self.wo = operations.Linear(dim, dim, bias=bias, device=device, dtype=dtype)
-
-    def forward(self, x, freqs=None, mask=None, transformer_options={}):
-        q, k, v, gate = self.wq(x), self.wk(x), self.wv(x), self.gate(x)
-        q = rearrange(q, "B L (H D) -> B H L D", H=self.heads)
-        k = rearrange(k, "B L (H D) -> B H L D", H=self.kvheads)
-        v = rearrange(v, "B L (H D) -> B H L D", H=self.kvheads)
-        q, k = self.qknorm(q, k)
-        if freqs is not None:
-            q, k = apply_rope(q, k, freqs)
-        if self.kvheads != self.heads:
-            rep = self.heads // self.kvheads
-            k = k.repeat_interleave(rep, dim=1)
-            v = v.repeat_interleave(rep, dim=1)
-        out = optimized_attention_masked(q, k, v, self.heads, mask=mask, skip_reshape=True,
-                                         transformer_options=transformer_options)
-        return self.wo(out * F.sigmoid(gate))
-
-
-class SimpleModulation(nn.Module):
-    def __init__(self, dim: int, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.lin = nn.Parameter(torch.empty(2, dim, device=device, dtype=dtype))
-
-    def forward(self, vec):
-        out = vec + comfy.model_management.cast_to(self.lin, dtype=vec.dtype, device=vec.device).unsqueeze(0)
-        scale, shift = out.chunk(2, dim=1)
-        return scale, shift
-
-
-class DoubleSharedModulation(nn.Module):
-    def __init__(self, dim: int, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.lin = nn.Parameter(torch.empty(6 * dim, device=device, dtype=dtype))
-
-    def forward(self, vec):
-        out = vec + comfy.model_management.cast_to(self.lin, dtype=vec.dtype, device=vec.device)
-        return out.chunk(6, dim=-1)
-
-
-class TextFusionBlock(nn.Module):
-    def __init__(self, features, heads, multiplier, bias=False, kvheads=None, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.prenorm = RMSNorm(features, device=device, dtype=dtype, operations=operations)
-        self.postnorm = RMSNorm(features, device=device, dtype=dtype, operations=operations)
-        self.attn = Attention(features, heads, kvheads=kvheads, bias=bias, device=device, dtype=dtype, operations=operations)
-        self.mlp = SwiGLU(features, multiplier, bias, device=device, dtype=dtype, operations=operations)
-
-    def forward(self, x, mask=None, transformer_options={}):
-        x = x + self.attn(self.prenorm(x), mask=mask, transformer_options=transformer_options)
-        x = x + self.mlp(self.postnorm(x))
-        return x
-
-
-class TextFusionTransformer(nn.Module):
-    def __init__(self, num_txt_layers, txt_dim, heads, multiplier, bias=False, kvheads=None, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.layerwise_blocks = nn.ModuleList([
-            TextFusionBlock(txt_dim, heads, multiplier, bias, kvheads, device=device, dtype=dtype, operations=operations)
-            for _ in range(2)
-        ])
-        self.projector = operations.Linear(num_txt_layers, 1, bias=False, device=device, dtype=dtype)
-        self.refiner_blocks = nn.ModuleList([
-            TextFusionBlock(txt_dim, heads, multiplier, bias, kvheads, device=device, dtype=dtype, operations=operations)
-            for _ in range(2)
-        ])
-
-    def forward(self, x, mask=None, transformer_options={}):
-        b, l, n, d = x.shape
-        x = x.reshape(b * l, n, d)
-        for block in self.layerwise_blocks:
-            x = block(x.contiguous(), mask=None, transformer_options=transformer_options)
-        x = rearrange(x, "(b l) n d -> b l d n", b=b, l=l)
-        x = self.projector(x).squeeze(-1)
-        for block in self.refiner_blocks:
-            x = block(x, mask=mask, transformer_options=transformer_options)
-        return x
-
-
-class SingleStreamBlock(nn.Module):
-    def __init__(self, features, heads, multiplier, bias=False, kvheads=None, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.mod = DoubleSharedModulation(features, device=device, dtype=dtype, operations=operations)
-        self.prenorm = RMSNorm(features, device=device, dtype=dtype, operations=operations)
-        self.postnorm = RMSNorm(features, device=device, dtype=dtype, operations=operations)
-        self.attn = Attention(features, heads, kvheads=kvheads, bias=bias, device=device, dtype=dtype, operations=operations)
-        self.mlp = SwiGLU(features, multiplier, bias, device=device, dtype=dtype, operations=operations)
-
-    def forward(self, x, vec, freqs, mask=None, transformer_options={}):
-        prescale, preshift, pregate, postscale, postshift, postgate = self.mod(vec)
-        x = x + pregate * self.attn((1 + prescale) * self.prenorm(x) + preshift, freqs, mask, transformer_options=transformer_options)
-        x = x + postgate * self.mlp((1 + postscale) * self.postnorm(x) + postshift)
-        return x
-
-
-class LastLayer(nn.Module):
-    def __init__(self, features, patch, channels, device=None, dtype=None, operations=None):
-        super().__init__()
-        self.norm = RMSNorm(features, device=device, dtype=dtype, operations=operations)
-        self.linear = operations.Linear(features, patch * patch * channels, bias=True, device=device, dtype=dtype)
-        self.modulation = SimpleModulation(features, device=device, dtype=dtype, operations=operations)
-
-    def forward(self, x, tvec):
-        scale, shift = self.modulation(tvec)
-        x = (1 + scale) * self.norm(x) + shift
-        return self.linear(x)
-
-
-class SingleStreamDiT(nn.Module):
-    def __init__(self, features=6144, tdim=256, txtdim=2560, heads=48, kvheads=12, multiplier=4,
-                 layers=28, patch=2, channels=16, bias=False, theta=1e3, txtlayers=12,
-                 txtheads=20, txtkvheads=20, image_model=None,
-                 device=None, dtype=None, operations=None, **kwargs):
-        super().__init__()
-        self.dtype = dtype
-        self.patch = patch
-        self.channels = channels
-        self.tdim = tdim
-        self.heads = heads
-        self.txtdim = txtdim
-        self.txtlayers = txtlayers
-
-        headdim = features // heads
-        axes = [headdim - 12 * (headdim // 16), 6 * (headdim // 16), 6 * (headdim // 16)]
-        assert sum(axes) == headdim, f"axes {axes} sum != headdim {headdim}"
-        self.pe_embedder = EmbedND(dim=headdim, theta=int(theta), axes_dim=axes)
-
-        self.first = operations.Linear(channels * patch ** 2, features, bias=True, device=device, dtype=dtype)
-        self.blocks = nn.ModuleList([
-            SingleStreamBlock(features, heads, multiplier, bias, kvheads, device=device, dtype=dtype, operations=operations)
-            for _ in range(layers)
-        ])
-        self.tmlp = nn.Sequential(
-            operations.Linear(tdim, features, device=device, dtype=dtype),
-            nn.GELU(approximate="tanh"),
-            operations.Linear(features, features, device=device, dtype=dtype),
-        )
-        self.txtfusion = TextFusionTransformer(txtlayers, txtdim, txtheads, multiplier, bias, txtkvheads,
-                                               device=device, dtype=dtype, operations=operations)
-        self.txtmlp = nn.Sequential(
-            RMSNorm(txtdim, device=device, dtype=dtype, operations=operations),
-            operations.Linear(txtdim, features, device=device, dtype=dtype),
-            nn.GELU(approximate="tanh"),
-            operations.Linear(features, features, device=device, dtype=dtype),
-        )
-        self.last = LastLayer(features, patch, channels, device=device, dtype=dtype, operations=operations)
-        self.tproj = nn.Sequential(
-            nn.GELU(approximate="tanh"),
-            operations.Linear(features, features * 6, device=device, dtype=dtype),
-        )
-
-    def forward(self, x, timesteps, context, attention_mask=None, transformer_options={}, **kwargs):
-        return comfy.patcher_extension.WrapperExecutor.new_class_executor(
-            self._forward,
-            self,
-            comfy.patcher_extension.get_all_wrappers(comfy.patcher_extension.WrappersMP.DIFFUSION_MODEL, transformer_options),
-        ).execute(x, timesteps, context, attention_mask, transformer_options, **kwargs)
-
-    def _forward(self, x, timesteps, context, attention_mask=None, transformer_options={}, **kwargs):
-        temporal = x.ndim == 5
-        if temporal:
-            b5, c5, t5, h5, w5 = x.shape
-            x = x.reshape(b5 * t5, c5, h5, w5)
-        bs, c, H_orig, W_orig = x.shape
-        patch = self.patch
-        # Pad the latent up to a multiple of patch (as Flux/Lumina/QwenImage do); crop back at the end.
-        x = comfy.ldm.common_dit.pad_to_patch_size(x, (patch, patch))
-        H, W = x.shape[-2], x.shape[-1]
-        h_, w_ = H // patch, W // patch
-
-        # context arrives as (B, seq, txtlayers*txtdim); reshape to (B, txtlayers, seq, txtdim).
-        context = self._unpack_context(context)
-
-        img = rearrange(x, "b c (h ph) (w pw) -> b (h w) (c ph pw)", ph=patch, pw=patch)
-        img = self.first(img)
-
-        t = self.tmlp(timestep_embedding(timesteps, self.tdim).unsqueeze(1).to(img.dtype))
-        tvec = self.tproj(t)
-
-        context = self.txtfusion(context, mask=None, transformer_options=transformer_options)
-        context = self.txtmlp(context)
-
-        txtlen, imglen = context.shape[1], img.shape[1]
-        combined = torch.cat((context, img), dim=1)
-
-        # Position ids: text at 0, image at (0, h_idx, w_idx).
-        device = combined.device
-        txtpos = torch.zeros(bs, txtlen, 3, device=device, dtype=torch.float32)
-        imgids = torch.zeros(h_, w_, 3, device=device, dtype=torch.float32)
-        imgids[..., 1] = torch.arange(h_, device=device, dtype=torch.float32)[:, None]
-        imgids[..., 2] = torch.arange(w_, device=device, dtype=torch.float32)[None, :]
-        imgpos = imgids.reshape(1, h_ * w_, 3).repeat(bs, 1, 1)
-        pos = torch.cat((txtpos, imgpos), dim=1)
-
-        freqs = self.pe_embedder(pos)
-
-        for block in self.blocks:
-            combined = block(combined, tvec, freqs, None, transformer_options=transformer_options)
-
-        final = self.last(combined, t)
-        out = final[:, txtlen:txtlen + imglen, :]
-        out = rearrange(out, "b (h w) (c ph pw) -> b c (h ph) (w pw)",
-                        h=h_, w=w_, ph=patch, pw=patch, c=self.channels)
-        out = out[:, :, :H_orig, :W_orig]  # crop padding back off
-        if temporal:
-            out = out.reshape(b5, t5, self.channels, H_orig, W_orig).movedim(1, 2)
-        return out
-
-    def _unpack_context(self, context):
-        # context: (B, seq, txtlayers*txtdim) -> (B, seq, txtlayers, txtdim).
-        b, seq, fused = context.shape
-        if fused != self.txtlayers * self.txtdim:
-            raise ValueError(
-                f"Krea2 expects conditioning with {self.txtlayers}x{self.txtdim}={self.txtlayers * self.txtdim} "
-                f"features (a {self.txtlayers}-layer Qwen3-VL stack) but got {fused}. "
-                f"Load the text encoder with CLIPLoader type 'krea2'."
-            )
-        return context.reshape(b, seq, self.txtlayers, self.txtdim)
--- a/comfy/lora.py
+++ b/comfy/lora.py
@ -326,17 +326,6 @@ def model_lora_keys_unet(model, key_map={}):
                key_map["transformer.{}".format(key_lora)] = k
                key_map["lycoris_{}".format(key_lora.replace(".", "_"))] = k #SimpleTuner lycoris format

-    if isinstance(model, comfy.model_base.Krea2):
-        diffusers_keys = comfy.utils.krea2_to_diffusers(model.model_config.unet_config, output_prefix="diffusion_model.")
-        for k in diffusers_keys:
-            if k.endswith(".weight"):
-                to = diffusers_keys[k]
-                key_lora = k[:-len(".weight")]
-                key_map["diffusion_model.{}".format(key_lora)] = to
-                key_map["transformer.{}".format(key_lora)] = to
-                key_map["lycoris_{}".format(key_lora.replace(".", "_"))] = to
-                key_map[key_lora] = to
-
    if isinstance(model, comfy.model_base.Lumina2):
        diffusers_keys = comfy.utils.z_image_to_diffusers(model.model_config.unet_config, output_prefix="diffusion_model.")
        for k in diffusers_keys:
--- a/comfy/model_base.py
+++ b/comfy/model_base.py
@ -58,7 +58,6 @@ import comfy.ldm.omnigen.omnigen2
 import comfy.ldm.boogu.model
 import comfy.ldm.qwen_image.model
 import comfy.ldm.ideogram4.model
-import comfy.ldm.krea2.model
 import comfy.ldm.kandinsky5.model
 import comfy.ldm.anima.model
 import comfy.ldm.ace.ace_step15
@ -2279,17 +2278,6 @@ class Ideogram4(BaseModel):
            out['c_crossattn'] = comfy.conds.CONDRegular(cross_attn)
        return out

-class Krea2(BaseModel):
-    def __init__(self, model_config, model_type=ModelType.FLUX, device=None):
-        super().__init__(model_config, model_type, device=device, unet_model=comfy.ldm.krea2.model.SingleStreamDiT)
-
-    def extra_conds(self, **kwargs):
-        out = super().extra_conds(**kwargs)
-        cross_attn = kwargs.get("cross_attn", None)
-        if cross_attn is not None:
-            out['c_crossattn'] = comfy.conds.CONDRegular(cross_attn)
-        return out
-
 class HunyuanImage21(BaseModel):
    def __init__(self, model_config, model_type=ModelType.FLOW, device=None):
        super().__init__(model_config, model_type, device=device, unet_model=comfy.ldm.hunyuan_video.model.HunyuanVideo)
--- a/comfy/model_detection.py
+++ b/comfy/model_detection.py
@ -834,21 +834,6 @@ def detect_unet_config(state_dict, key_prefix, metadata=None):
        dit_config["num_layers"] = count_blocks(state_dict_keys, '{}layers.'.format(key_prefix) + '{}.')
        return dit_config

-    if '{}txtfusion.projector.weight'.format(key_prefix) in state_dict_keys:  # Krea 2 (K2)
-        dit_config = {}
-        dit_config["image_model"] = "krea2"
-        head_dim = 128
-        first_w = state_dict['{}first.weight'.format(key_prefix)]  # (features, channels*patch^2)
-        dit_config["features"] = first_w.shape[0]
-        dit_config["channels"] = first_w.shape[1] // (2 * 2)  # patch=2
-        dit_config["patch"] = 2
-        dit_config["layers"] = count_blocks(state_dict_keys, '{}blocks.'.format(key_prefix) + '{}.')
-        dit_config["heads"] = state_dict['{}blocks.0.attn.wq.weight'.format(key_prefix)].shape[0] // head_dim
-        dit_config["kvheads"] = state_dict['{}blocks.0.attn.wk.weight'.format(key_prefix)].shape[0] // head_dim
-        dit_config["txtlayers"] = state_dict['{}txtfusion.projector.weight'.format(key_prefix)].shape[1]
-        dit_config["txtdim"] = state_dict['{}txtfusion.layerwise_blocks.0.prenorm.scale'.format(key_prefix)].shape[0]
-        return dit_config
-
    if '{}visual_transformer_blocks.0.cross_attention.key_norm.weight'.format(key_prefix) in state_dict_keys: # Kandinsky 5
        dit_config = {}
        model_dim = state_dict['{}visual_embeddings.in_layer.bias'.format(key_prefix)].shape[0]
--- a/comfy/sd.py
+++ b/comfy/sd.py
@ -58,7 +58,6 @@ import comfy.text_encoders.omnigen2
 import comfy.text_encoders.qwen_image
 import comfy.text_encoders.hunyuan_image
 import comfy.text_encoders.z_image
-import comfy.text_encoders.krea2
 import comfy.text_encoders.ideogram4
 import comfy.text_encoders.ovis
 import comfy.text_encoders.kandinsky5
@ -1304,7 +1303,6 @@ class CLIPType(Enum):
    PIXELDIT = 29
    IDEOGRAM4 = 30
    BOOGU = 31
-    KREA2 = 32



@ -1630,10 +1628,6 @@ def load_text_encoder_state_dicts(state_dicts=[], embedding_directory=None, clip
                clip_data[0] = comfy.utils.state_dict_prefix_replace(clip_data[0], {"model.language_model.": "model.", "model.visual.": "visual.", "lm_head.": "model.lm_head."})
                clip_target.clip = comfy.text_encoders.boogu.te(**llama_detect(clip_data))
                clip_target.tokenizer = comfy.text_encoders.boogu.BooguTokenizer
-            elif clip_type == CLIPType.KREA2 and te_model == TEModel.QWEN3VL_4B:  # Krea2: full Qwen3-VL-4B (12-layer tap for conditioning + multimodal generate).
-                clip_data[0] = comfy.utils.state_dict_prefix_replace(clip_data[0], {"model.language_model.": "model.", "model.visual.": "visual.", "lm_head.": "model.lm_head."})
-                clip_target.clip = comfy.text_encoders.krea2.te(**llama_detect(clip_data))
-                clip_target.tokenizer = comfy.text_encoders.krea2.Krea2Tokenizer
            elif clip_type in (CLIPType.FLUX, CLIPType.FLUX2):  # Flux2 Klein reuses the Qwen3-VL LM (3-layer tap -> 12288); visual unused.
                klein_model_type = "qwen3_8b" if te_model == TEModel.QWEN3VL_8B else "qwen3_4b"
                clip_target.clip = comfy.text_encoders.flux.klein_te(**llama_detect(clip_data), model_type=klein_model_type)
--- a/comfy/supported_models.py
+++ b/comfy/supported_models.py
@ -26,7 +26,6 @@ import comfy.text_encoders.kandinsky5
 import comfy.text_encoders.z_image
 import comfy.text_encoders.ideogram4
 import comfy.text_encoders.boogu
-import comfy.text_encoders.krea2
 import comfy.text_encoders.anima
 import comfy.text_encoders.ace15
 import comfy.text_encoders.longcat_image
@ -1819,35 +1818,6 @@ class Ideogram4(supported_models_base.BASE):
        hunyuan_detect = comfy.text_encoders.hunyuan_video.llama_detect(state_dict, "{}qwen3vl_8b.transformer.".format(pref))
        return supported_models_base.ClipTarget(comfy.text_encoders.ideogram4.Ideogram4Tokenizer, comfy.text_encoders.ideogram4.te(**hunyuan_detect))

-
-class Krea2(supported_models_base.BASE):
-    unet_config = {
-        "image_model": "krea2",
-    }
-
-    sampling_settings = {
-        "multiplier": 1.0,
-        "shift": 1.15,
-    }
-
-    memory_usage_factor = 2.2
-
-    latent_format = latent_formats.Wan21
-
-    supported_inference_dtypes = [torch.bfloat16, torch.float16, torch.float32]
-
-    vae_key_prefix = ["vae."]
-    text_encoder_key_prefix = ["text_encoders."]
-
-    def get_model(self, state_dict, prefix="", device=None):
-        out = model_base.Krea2(self, device=device)
-        return out
-
-    def clip_target(self, state_dict={}):
-        pref = self.text_encoder_key_prefix[0]
-        hunyuan_detect = comfy.text_encoders.hunyuan_video.llama_detect(state_dict, "{}qwen3vl_4b.transformer.".format(pref))
-        return supported_models_base.ClipTarget(comfy.text_encoders.krea2.Krea2Tokenizer, comfy.text_encoders.krea2.te(**hunyuan_detect))
-
 class QwenImage(supported_models_base.BASE):
    unet_config = {
        "image_model": "qwen_image",
@ -2355,7 +2325,6 @@ models = [
    Boogu,
    QwenImage,
    Ideogram4,
-    Krea2,
    Flux2,
    Lens,
    Kandinsky5Image,
--- a/comfy/text_encoders/krea2.py
+++ b/comfy/text_encoders/krea2.py
@ -1,84 +0,0 @@
-"""Krea 2 (K2) text encoder: Qwen3-VL-4B, 12-layer tap.
-
-K2 conditions on a stack of hidden states from 12 layers of Qwen3-VL-4B
-(reference taps ``hidden_states[2,5,8,...,35]``), kept as a ``(B, 12, seq, 2560)`` tensor and
-consumed by the DiT's internal ``txtfusion`` adapter. Comfy carries conditioning as a 3D tensor,
-so the 12-layer stack is flattened to ``(B, seq, 12*2560)`` here and unpacked inside the model.
-"""
-
-import numbers
-
-import torch
-
-import comfy.text_encoders.qwen3vl
-from comfy import sd1_clip
-
-# tap k == hidden_states[k] (no offset).
-KREA2_TAP_LAYERS = [2, 5, 8, 11, 14, 17, 20, 23, 26, 29, 32, 35]
-
-# Identical system template to Qwen-Image; Krea2 strips the system+user-opening prefix.
-KREA2_TEMPLATE = "<|im_start|>system\nDescribe the image by detailing the color, shape, size, texture, quantity, text, spatial relationships of the objects and background:<|im_end|>\n<|im_start|>user\n{}<|im_end|>\n<|im_start|>assistant\n"
-
-
-class Krea2Tokenizer(comfy.text_encoders.qwen3vl.Qwen3VLTokenizer):
-    def __init__(self, embedding_directory=None, tokenizer_data={}):
-        super().__init__(embedding_directory=embedding_directory, tokenizer_data=tokenizer_data, model_type="qwen3vl_4b")
-        self.llama_template = KREA2_TEMPLATE  # conditioning template; image text-gen uses qwen3vl's default image template.
-
-    def tokenize_with_weights(self, text, return_word_ids=False, llama_template=None, images=[], prevent_empty_text=False, thinking=True, **kwargs):
-        # Krea2 conditions on the no-think template; thinking=True drops the empty <think> block qwen3vl adds.
-        return super().tokenize_with_weights(text, return_word_ids=return_word_ids, llama_template=llama_template, images=images, prevent_empty_text=prevent_empty_text, thinking=thinking, **kwargs)
-
-
-class Krea2Qwen3VLClipModel(comfy.text_encoders.qwen3vl.Qwen3VLClipModel):
-    def __init__(self, device="cpu", dtype=None, attention_mask=True, model_options={}):
-        super().__init__(device=device, layer=KREA2_TAP_LAYERS, layer_idx=None, dtype=dtype,
-                         attention_mask=attention_mask, model_options=model_options, model_type="qwen3vl_4b")
-
-
-class Krea2TEModel(sd1_clip.SD1ClipModel):
-    def __init__(self, device="cpu", dtype=None, model_options={}):
-        super().__init__(device=device, dtype=dtype, name="qwen3vl_4b", clip_model=Krea2Qwen3VLClipModel, model_options=model_options)
-
-    def encode_token_weights(self, token_weight_pairs, template_end=-1):
-        out, pooled, extra = super().encode_token_weights(token_weight_pairs)  # out: (B, 12, seq, 2560)
-        tok_pairs = token_weight_pairs["qwen3vl_4b"][0]
-
-        # Strip the system + user-opening prefix
-        count_im_start = 0
-        if template_end == -1:
-            for i, v in enumerate(tok_pairs):
-                elem = v[0]
-                if not torch.is_tensor(elem) and isinstance(elem, numbers.Integral):
-                    if elem == 151644 and count_im_start < 2:
-                        template_end = i
-                        count_im_start += 1
-            if out.shape[2] > (template_end + 3):
-                if tok_pairs[template_end + 1][0] == 872:      # "user"
-                    if tok_pairs[template_end + 2][0] == 198:   # "\n"
-                        template_end += 3
-
-        out = out[:, :, template_end:]
-
-        b, n, seq, h = out.shape
-        # Flatten the 12-layer axis into the feature dim: (B, seq, 12*2560). Unpacked in the model.
-        out = out.permute(0, 2, 1, 3).reshape(b, seq, n * h)
-
-        if "attention_mask" in extra:
-            extra["attention_mask"] = extra["attention_mask"][:, template_end:]
-            if extra["attention_mask"].sum() == torch.numel(extra["attention_mask"]):
-                extra.pop("attention_mask")
-
-        return out, pooled, extra
-
-
-def te(dtype_llama=None, llama_quantization_metadata=None):
-    class Krea2TEModel_(Krea2TEModel):
-        def __init__(self, device="cpu", dtype=None, model_options={}):
-            if llama_quantization_metadata is not None:
-                model_options = model_options.copy()
-                model_options["quantization_metadata"] = llama_quantization_metadata
-            if dtype_llama is not None:
-                dtype = dtype_llama
-            super().__init__(device=device, dtype=dtype, model_options=model_options)
-    return Krea2TEModel_
--- a/comfy/utils.py
+++ b/comfy/utils.py
@ -818,44 +818,6 @@ def z_image_to_diffusers(mmdit_config, output_prefix=""):

    return key_map

-def krea2_to_diffusers(mmdit_config, output_prefix=""):
-    n_layers = mmdit_config.get("layers", 0)
-    n_txt_layerwise = 2  # TextFusionTransformer hardcodes 2 layerwise + 2 refiner blocks
-    n_txt_refiner = 2
-    key_map = {}
-
-    def add_block(prefix_to, prefix_from):
-        block_map = {
-            "attn.to_q": "attn.wq", "attn.to_k": "attn.wk", "attn.to_v": "attn.wv",
-            "attn.to_gate": "attn.gate", "attn.to_out.0": "attn.wo",
-            "attn.to_out": "attn.wo",  # some tools drop the ".0" on to_out
-            "ff.gate": "mlp.gate", "ff.up": "mlp.up", "ff.down": "mlp.down",
-        }
-        for d, c in block_map.items():
-            key_map["{}.{}.weight".format(prefix_to, d)] = "{}{}.{}.weight".format(output_prefix, prefix_from, c)
-
-    for i in range(n_layers):
-        add_block("transformer_blocks.{}".format(i), "blocks.{}".format(i))
-    for i in range(n_txt_layerwise):
-        add_block("text_fusion.layerwise_blocks.{}".format(i), "txtfusion.layerwise_blocks.{}".format(i))
-    for i in range(n_txt_refiner):
-        add_block("text_fusion.refiner_blocks.{}".format(i), "txtfusion.refiner_blocks.{}".format(i))
-
-    MAP_BASIC = [
-        ("img_in", "first"),
-        ("time_embed.linear_1", "tmlp.0"),
-        ("time_embed.linear_2", "tmlp.2"),
-        ("time_mod_proj", "tproj.1"),
-        ("txt_in.linear_1", "txtmlp.1"),
-        ("txt_in.linear_2", "txtmlp.3"),
-        ("text_fusion.projector", "txtfusion.projector"),
-        ("final_layer.linear", "last.linear"),
-    ]
-    for d, c in MAP_BASIC:
-        key_map["{}.weight".format(d)] = "{}{}.weight".format(output_prefix, c)
-
-    return key_map
-
 def repeat_to_batch_size(tensor, batch_size, dim=0):
    if tensor.shape[dim] > batch_size:
        return tensor.narrow(dim, 0, batch_size)
--- a/comfy_api/feature_flags.py
+++ b/comfy_api/feature_flags.py
@ -9,6 +9,7 @@ import logging
 from typing import Any, TypedDict

 from comfy.cli_args import args
+from comfy.comfy_api_env import get_frontend_config


 class FeatureFlagInfo(TypedDict):
@ -162,4 +163,11 @@ def get_server_features() -> dict[str, Any]:
    Returns:
        Dictionary of server feature flags
    """
-    return SERVER_FEATURE_FLAGS.copy()
+    features = SERVER_FEATURE_FLAGS.copy()
+    # When --comfy-api-base targets a staging-tier comfy.org backend (the staging api host or an ephemeral testenv),
+    # surface the api + platform base so the frontend can reach it without a rebuild
+    # (it derives the Firebase project from the api base). Prod / self-hosted bases keep build-time defaults.
+    overrides = get_frontend_config()
+    if overrides:
+        features.update(overrides)
+    return features
--- a/comfy_api_nodes/util/_helpers.py
+++ b/comfy_api_nodes/util/_helpers.py
@ -11,6 +11,7 @@ from io import BytesIO
 from yarl import URL

 from comfy.cli_args import args
+from comfy.comfy_api_env import normalize_comfy_api_base
 from comfy.deploy_environment import get_deploy_environment
 from comfy.model_management import processing_interrupted
 from comfy_api.latest import IO
@ -63,7 +64,7 @@ def get_comfy_api_headers(node_cls: type[IO.ComfyNode]) -> dict[str, str]:


 def default_base_url() -> str:
-    return getattr(args, "comfy_api_base", "https://api.comfy.org")
+    return normalize_comfy_api_base(getattr(args, "comfy_api_base", "https://api.comfy.org"))  # testenv main host -> its "-registry" sibling; any other base is returned unchanged


 async def sleep_with_interrupt(
--- a/comfy_extras/nodes_audio.py
+++ b/comfy_extras/nodes_audio.py
@ -158,7 +158,7 @@ class SaveAudio(IO.ComfyNode):
        return IO.Schema(
            node_id="SaveAudio",
            search_aliases=["export flac"],
-            display_name="Save Audio (FLAC) (DEPRECATED)",
+            display_name="Save Audio (FLAC) (Deprecated)",
            category="audio",
            essentials_category="Audio",
            inputs=[
@ -166,9 +166,8 @@ class SaveAudio(IO.ComfyNode):
                IO.String.Input("filename_prefix", default="audio/ComfyUI"),
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
-            is_deprecated=True,
            is_output_node=True,
-            outputs=[IO.Audio.Output("audio")]
+            is_deprecated=True,
        )

    @classmethod
@ -176,10 +175,11 @@ class SaveAudio(IO.ComfyNode):
        if audio is None:
            raise ValueError("SaveAudio: input audio is None (source video may have no audio track).")
        return IO.NodeOutput(
-            audio,
            ui=UI.AudioSaveHelper.get_save_audio_ui(audio, filename_prefix=filename_prefix, cls=cls, format=format)
        )

+    save_flac = execute  # TODO: remove
+

 class SaveAudioMP3(IO.ComfyNode):
    @classmethod
@ -187,7 +187,7 @@ class SaveAudioMP3(IO.ComfyNode):
        return IO.Schema(
            node_id="SaveAudioMP3",
            search_aliases=["export mp3"],
-            display_name="Save Audio (MP3) (DEPRECATED)",
+            display_name="Save Audio (MP3) (Deprecated)",
            category="audio",
            essentials_category="Audio",
            inputs=[
@ -196,9 +196,8 @@ class SaveAudioMP3(IO.ComfyNode):
                IO.Combo.Input("quality", options=["V0", "128k", "320k"], default="V0"),
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
-            is_deprecated=True,
            is_output_node=True,
-            outputs=[IO.Audio.Output("audio")]
+            is_deprecated=True,
        )

    @classmethod
@ -206,12 +205,13 @@ class SaveAudioMP3(IO.ComfyNode):
        if audio is None:
            raise ValueError("SaveAudioMP3: input audio is None (source video may have no audio track).")
        return IO.NodeOutput(
-            audio,
            ui=UI.AudioSaveHelper.get_save_audio_ui(
                audio, filename_prefix=filename_prefix, cls=cls, format=format, quality=quality
            )
        )

+    save_mp3 = execute  # TODO: remove
+

 class SaveAudioOpus(IO.ComfyNode):
    @classmethod
@ -219,7 +219,7 @@ class SaveAudioOpus(IO.ComfyNode):
        return IO.Schema(
            node_id="SaveAudioOpus",
            search_aliases=["export opus"],
-            display_name="Save Audio (Opus) (DEPRECATED)",
+            display_name="Save Audio (Opus) (Deprecated)",
            category="audio",
            inputs=[
                IO.Audio.Input("audio"),
@ -227,9 +227,8 @@ class SaveAudioOpus(IO.ComfyNode):
                IO.Combo.Input("quality", options=["64k", "96k", "128k", "192k", "320k"], default="128k"),
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
-            is_deprecated=True,
            is_output_node=True,
-            outputs=[IO.Audio.Output("audio")]
+            is_deprecated=True,
        )

    @classmethod
@ -237,12 +236,13 @@ class SaveAudioOpus(IO.ComfyNode):
        if audio is None:
            raise ValueError("SaveAudioOpus: input audio is None (source video may have no audio track).")
        return IO.NodeOutput(
-            audio,
            ui=UI.AudioSaveHelper.get_save_audio_ui(
                audio, filename_prefix=filename_prefix, cls=cls, format=format, quality=quality
            )
        )

+    save_opus = execute  # TODO: remove
+

 class SaveAudioAdvanced(IO.ComfyNode):
    @classmethod
@ -258,7 +258,10 @@ class SaveAudioAdvanced(IO.ComfyNode):
                IO.String.Input(
                    "filename_prefix",
                    default="audio/ComfyUI",
-                    tooltip=("The prefix for the file to save. May include formatting tokens such as %date:yyyy-MM-dd%."),
+                    tooltip=(
+                        "The prefix for the file to save. May include formatting tokens "
+                        "such as %date:yyyy-MM-dd%."
+                    ),
                ),
                IO.DynamicCombo.Input(
                    "format",
@ -276,7 +279,6 @@ class SaveAudioAdvanced(IO.ComfyNode):
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[IO.Audio.Output("audio")],
        )

    @classmethod
@ -287,7 +289,7 @@ class SaveAudioAdvanced(IO.ComfyNode):
            ui=UI.AudioSaveHelper.get_save_audio_ui(audio, filename_prefix=filename_prefix, cls=cls, format=file_format, quality=quality)
        else:
            ui=UI.AudioSaveHelper.get_save_audio_ui(audio, filename_prefix=filename_prefix, cls=cls, format=file_format)
-        return IO.NodeOutput(audio, ui=ui)
+        return IO.NodeOutput(ui=ui)


 class PreviewAudio(IO.ComfyNode):
@ -303,14 +305,13 @@ class PreviewAudio(IO.ComfyNode):
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[IO.Audio.Output("audio")]
        )

     @classmethod
     def execute(cls, audio) -> IO.NodeOutput:
         if audio is None:
             raise ValueError("PreviewAudio: input audio is None (source video may have no audio track).")
-        return IO.NodeOutput(audio, ui=UI.PreviewAudio(audio, cls=cls))
+        return IO.NodeOutput(ui=UI.PreviewAudio(audio, cls=cls))  # UI payload only: the audio is no longer passed through as a node output

    save_flac = execute  # TODO: remove

--- a/comfy_extras/nodes_images.py
+++ b/comfy_extras/nodes_images.py
@ -214,13 +214,11 @@ class SaveAnimatedWEBP(IO.ComfyNode):
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[IO.Image.Output(display_name="images")]
        )

    @classmethod
    def execute(cls, images, fps, filename_prefix, lossless, quality, method, num_frames=0) -> IO.NodeOutput:
        return IO.NodeOutput(
-            images,
            ui=UI.ImageSaveHelper.get_save_animated_webp_ui(
                images=images,
                filename_prefix=filename_prefix,
@ -232,6 +230,8 @@ class SaveAnimatedWEBP(IO.ComfyNode):
            )
        )

+    save_images = execute  # TODO: remove
+

 class SaveAnimatedPNG(IO.ComfyNode):

@ -249,13 +249,11 @@ class SaveAnimatedPNG(IO.ComfyNode):
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[IO.Image.Output(display_name="images")]
        )

    @classmethod
    def execute(cls, images, fps, compress_level, filename_prefix="ComfyUI") -> IO.NodeOutput:
        return IO.NodeOutput(
-            images,
            ui=UI.ImageSaveHelper.get_save_animated_png_ui(
                images=images,
                filename_prefix=filename_prefix,
@ -265,6 +263,8 @@ class SaveAnimatedPNG(IO.ComfyNode):
            )
        )

+    save_images = execute  # TODO: remove
+

 class ImageStitch(IO.ComfyNode):
    """Upstreamed from https://github.com/kijai/ComfyUI-KJNodes"""
@ -513,7 +513,6 @@ class SaveSVGNode(IO.ComfyNode):
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[IO.SVG.Output("svg")],
        )

    @classmethod
@ -563,7 +562,9 @@ class SaveSVGNode(IO.ComfyNode):

            results.append(UI.SavedResult(filename=file, subfolder=subfolder, type=IO.FolderType.output))
            counter += 1
-        return IO.NodeOutput(svg, ui={"images": results})
+        return IO.NodeOutput(ui={"images": results})
+
+    save_svg = execute  # TODO: remove


 class GetImageSize(IO.ComfyNode):
@ -1156,27 +1157,40 @@ class SaveImageAdvanced(IO.ComfyNode):
                IO.String.Input(
                    "filename_prefix",
                    default="ComfyUI",
-                    tooltip=("The prefix for the file to save. May include formatting tokens such as %date:yyyy-MM-dd% or %Empty Latent Image.width%."),
+                    tooltip=(
+                        "The prefix for the file to save. May include formatting tokens "
+                        "such as %date:yyyy-MM-dd% or %Empty Latent Image.width%."
+                    ),
                ),
                IO.DynamicCombo.Input(
                    "format",
                    options=[
                        IO.DynamicCombo.Option("png", [
-                            IO.Combo.Input("bit_depth", options=["8-bit", "16-bit"], default="8-bit", advanced=True),
-                            IO.Combo.Input("input_color_space", options=["sRGB"], default="sRGB", advanced=True),
+                            IO.Combo.Input("bit_depth", options=["8-bit", "16-bit"],
+                                           default="8-bit", advanced=True),
+                            IO.Combo.Input("input_color_space", options=["sRGB"],
+                                           default="sRGB", advanced=True),
                        ]),
                        IO.DynamicCombo.Option("exr", [
-                            IO.Combo.Input("bit_depth", options=["32-bit float"], default="32-bit float", advanced=True),
+                            IO.Combo.Input("bit_depth", options=["32-bit float"],
+                                           default="32-bit float", advanced=True),
                            IO.Combo.Input(
                                "input_color_space",
                                options=["sRGB", "HDR", "linear"],
                                default="sRGB",
                                advanced=True,
                                tooltip=(
-                                    "Colorspace of the input tensor. The EXR is always written as scene-linear in the matching gamut.\n"
-                                    "sRGB — input is sRGB-encoded Rec.709; the inverse sRGB EOTF is applied.\n"
-                                    "HDR — input is HLG-encoded Rec.2020 (BT.2100); the inverse HLG OETF is applied to get scene-linear light.\n"
-                                    "linear — input is already scene-linear (Rec.709 primaries); written through unchanged. Use this for renderer/compositor output."
+                                    "Colorspace of the input tensor. The EXR is "
+                                    "always written as scene-linear in the matching "
+                                    "gamut.\n"
+                                    "  'sRGB'   — input is sRGB-encoded Rec.709; "
+                                    "the inverse sRGB EOTF is applied.\n"
+                                    "  'HDR'    — input is HLG-encoded Rec.2020 "
+                                    "(BT.2100); the inverse HLG OETF is applied "
+                                    "to get scene-linear light.\n"
+                                    "  'linear' — input is already scene-linear "
+                                    "(Rec.709 primaries); written through unchanged. "
+                                    "Use this for renderer/compositor output."
                                ),
                            ),
                        ]),
@ -1186,7 +1200,6 @@ class SaveImageAdvanced(IO.ComfyNode):
            ],
            hidden=[IO.Hidden.prompt, IO.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[IO.Image.Output(display_name="images")]
        )

    @classmethod
@ -1224,7 +1237,7 @@ class SaveImageAdvanced(IO.ComfyNode):
            results.append({"filename": file, "subfolder": subfolder, "type": "output"})
            counter += 1

-        return IO.NodeOutput(images, ui={"images": results})
+        return IO.NodeOutput(ui={"images": results})


 class ImagesExtension(ComfyExtension):
--- a/comfy_extras/nodes_video.py
+++ b/comfy_extras/nodes_video.py
@ -27,7 +27,6 @@ class SaveWEBM(io.ComfyNode):
            ],
            hidden=[io.Hidden.prompt, io.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[io.Image.Output(display_name="images")]
        )

    @classmethod
@ -70,7 +69,7 @@ class SaveWEBM(io.ComfyNode):
        container.mux(stream.encode())
        container.close()

-        return io.NodeOutput(images, ui=ui.PreviewVideo([ui.SavedResult(file, subfolder, io.FolderType.output)]))
+        return io.NodeOutput(ui=ui.PreviewVideo([ui.SavedResult(file, subfolder, io.FolderType.output)]))

 class SaveVideo(io.ComfyNode):
    @classmethod
@ -90,7 +89,6 @@ class SaveVideo(io.ComfyNode):
            ],
            hidden=[io.Hidden.prompt, io.Hidden.extra_pnginfo],
            is_output_node=True,
-            outputs=[io.Video.Output("video")],
        )

    @classmethod
@ -119,7 +117,7 @@ class SaveVideo(io.ComfyNode):
            metadata=saved_metadata
        )

-        return io.NodeOutput(video, ui=ui.PreviewVideo([ui.SavedResult(file, subfolder, io.FolderType.output)]))
+        return io.NodeOutput(ui=ui.PreviewVideo([ui.SavedResult(file, subfolder, io.FolderType.output)]))


 class CreateVideo(io.ComfyNode):
--- a/extra_model_paths.yaml.example
+++ b/extra_model_paths.yaml.example
@ -8,37 +8,21 @@
 #     # You can use is_default to mark that these folders should be listed first, and used as the default dirs for eg downloads
 #     #is_default: true
 #     checkpoints: models/checkpoints/
-#     configs: models/configs/
-#     loras: models/loras/
-#     vae: models/vae/
 #     text_encoders: |
 #          models/text_encoders/
-#          models/clip/
-#     diffusion_models: |
-#          models/unet/
-#          models/diffusion_models/
+#          models/clip/
 #     clip_vision: models/clip_vision/
-#     style_models: models/style_models/
+#     configs: models/configs/
+#     controlnet: models/controlnet/
+#     diffusion_models: |
+#                  models/diffusion_models
+#                  models/unet
 #     embeddings: models/embeddings/
-#     diffusers: models/diffusers/
-#     vae_approx: models/vae_approx/
-#     controlnet: |
-#          models/controlnet/
-#          models/t2i_adapter/
-#     gligen: models/gligen/
+#     loras: models/loras/
 #     upscale_models: models/upscale_models/
-#     latent_upscale_models: models/latent_upscale_models/
-#     custom_nodes: custom_nodes/
-#     hypernetworks: models/hypernetworks/
-#     photomaker: models/photomaker/
-#     classifiers: models/classifiers/
-#     model_patches: models/model_patches/
+#     vae: models/vae/
 #     audio_encoders: models/audio_encoders/
-#     background_removal: models/background_removal/
-#     frame_interpolation: models/frame_interpolation/
-#     geometry_estimation: models/geometry_estimation/
-#     optical_flow: models/optical_flow/
-#     detection: models/detection/
+#     model_patches: models/model_patches/


 #config for a1111 ui
@ -61,7 +45,8 @@
 #     controlnet: models/ControlNet


-# For the canonical list of supported keys and extensions, see folder_paths.py.
+# For a full list of supported keys (style_models, vae_approx, hypernetworks, photomaker,
+# model_patches, audio_encoders, classifiers, etc.) see folder_paths.py.

 #other_ui:
 #    base_path: path/to/ui
--- a/nodes.py
+++ b/nodes.py
@ -480,13 +480,11 @@ class SaveLatent:

    @classmethod
    def INPUT_TYPES(s):
-        return { "required": {
-            "samples": ("LATENT",),
-            "filename_prefix": ("STRING", {"default": "latents/ComfyUI"})},
-            "hidden": {"prompt": "PROMPT", "extra_pnginfo": "EXTRA_PNGINFO"},
-        }
-    RETURN_TYPES = ("LATENT",)
-    RETURN_NAMES = ("samples",)
+        return {"required": { "samples": ("LATENT", ),
+                              "filename_prefix": ("STRING", {"default": "latents/ComfyUI"})},
+                "hidden": {"prompt": "PROMPT", "extra_pnginfo": "EXTRA_PNGINFO"},
+                }
+    RETURN_TYPES = ()
    FUNCTION = "save"

    OUTPUT_NODE = True
@ -524,7 +522,7 @@ class SaveLatent:
        output["latent_format_version_0"] = torch.tensor([])

        comfy.utils.save_torch_file(output, file, metadata=metadata)
-        return { "ui": { "latents": results }, "result": (samples,) }
+        return { "ui": { "latents": results } }


 class LoadLatent:
@ -969,7 +967,7 @@ class CLIPLoader:
    @classmethod
    def INPUT_TYPES(s):
        return {"required": { "clip_name": (folder_paths.get_filename_list("text_encoders"), ),
-                              "type": (["stable_diffusion", "stable_cascade", "sd3", "stable_audio", "mochi", "ltxv", "pixart", "cosmos", "lumina2", "wan", "hidream", "chroma", "ace", "omnigen2", "qwen_image", "hunyuan_image", "flux2", "ovis", "longcat_image", "cogvideox", "lens", "pixeldit", "ideogram4", "boogu", "krea2"], ),
+                              "type": (["stable_diffusion", "stable_cascade", "sd3", "stable_audio", "mochi", "ltxv", "pixart", "cosmos", "lumina2", "wan", "hidream", "chroma", "ace", "omnigen2", "qwen_image", "hunyuan_image", "flux2", "ovis", "longcat_image", "cogvideox", "lens", "pixeldit", "ideogram4", "boogu"], ),
                              },
                "optional": {
                              "device": (["default", "cpu"], {"advanced": True}),
@ -1629,18 +1627,14 @@ class SaveImage:
        return {
            "required": {
                "images": ("IMAGE", {"tooltip": "The images to save."}),
-                "filename_prefix": ("STRING", {
-                    "default": "ComfyUI",
-                    "tooltip": "The prefix for the file to save. This may include formatting information such as %date:yyyy-MM-dd% or %Empty Latent Image.width% to include values from nodes."
-                })
+                "filename_prefix": ("STRING", {"default": "ComfyUI", "tooltip": "The prefix for the file to save. This may include formatting information such as %date:yyyy-MM-dd% or %Empty Latent Image.width% to include values from nodes."})
            },
            "hidden": {
                "prompt": "PROMPT", "extra_pnginfo": "EXTRA_PNGINFO"
            },
        }

-    RETURN_TYPES = ("IMAGE",)
-    RETURN_NAMES = ("images",)
+    RETURN_TYPES = ()
    FUNCTION = "save_images"

    OUTPUT_NODE = True
@ -1676,7 +1670,7 @@ class SaveImage:
            })
            counter += 1

-        return { "ui": { "images": results }, "result" : (images,) }
+        return { "ui": { "images": results } }

 class PreviewImage(SaveImage):
    def __init__(self):
--- a/requirements.txt
+++ b/requirements.txt
@ -1,6 +1,6 @@
 comfyui-frontend-package==1.45.19
 comfyui-workflow-templates==0.10.0
-comfyui-embedded-docs==0.5.5
+comfyui-embedded-docs==0.5.4
 torch
 torchsde
 torchvision
--- a/tests-unit/feature_flags_test.py
+++ b/tests-unit/feature_flags_test.py
@ -11,6 +11,10 @@ from comfy_api.feature_flags import (
    _coerce_flag_value,
    _parse_cli_feature_flags,
 )
+from comfy.comfy_api_env import (
+    frontend_config_for_base,
+    normalize_comfy_api_base,
+)


 class TestFeatureFlags:
@ -181,3 +185,50 @@ class TestCliFeatureFlagRegistry:
            assert "type" in info, f"{key} missing 'type'"
            assert "default" in info, f"{key} missing 'default'"
            assert "description" in info, f"{key} missing 'description'"
+
+
+class TestComfyApiEnv:
+    """--comfy-api-base staging-tier detection + testenv main-host -> -registry rewrite."""
+
+    @pytest.mark.parametrize(
+        "url, expected",
+        [
+            # testenv friendly main host -> comfy-api '-registry' sibling; the rebuilt URL carries no path, so a trailing slash is dropped
+            ("https://pr-4398.testenvs.comfy.org", "https://pr-4398-registry.testenvs.comfy.org"),
+            ("https://pr-4398.testenvs.comfy.org/", "https://pr-4398-registry.testenvs.comfy.org"),
+            ("https://pr-4398-registry.testenvs.comfy.org", "https://pr-4398-registry.testenvs.comfy.org"),  # already the -registry host: returned as-is
+            # staging, prod and any non-testenv host -> returned unchanged (only testenvs have a -registry sibling)
+            ("https://stagingapi.comfy.org", "https://stagingapi.comfy.org"),
+            ("https://api.comfy.org", "https://api.comfy.org"),
+            ("https://pr-1.testenvs.comfy.org.evil.com", "https://pr-1.testenvs.comfy.org.evil.com"),  # the testenv suffix must end the hostname; look-alike domains are not rewritten
+            ("", ""),  # empty string has no hostname and passes through untouched
+        ],
+    )
+    def test_normalize_comfy_api_base(self, url, expected):
+        assert normalize_comfy_api_base(url) == expected
+
+    def test_config_for_staging_tier_else_none(self):
+        # ephemeral testenv: friendly main host -> -registry api base (trailing slash stripped), staging platform
+        eph = frontend_config_for_base("https://pr-1234.testenvs.comfy.org/")
+        assert eph["comfy_api_base_url"] == "https://pr-1234-registry.testenvs.comfy.org"
+        assert eph["comfy_platform_base_url"] == "https://stagingplatform.comfy.org"
+        # staging api host: api base emitted as-is, same staging platform
+        stg = frontend_config_for_base("https://stagingapi.comfy.org")
+        assert stg["comfy_api_base_url"] == "https://stagingapi.comfy.org"
+        assert stg["comfy_platform_base_url"] == "https://stagingplatform.comfy.org"
+        # prod base: no overrides at all (None)
+        assert frontend_config_for_base("https://api.comfy.org") is None
+
+    def test_server_features_merge_only_for_staging_tier(self, monkeypatch):
+        def set_base(url):  # replace comfy_api_env's module-level `args` with a stub exposing only comfy_api_base
+            monkeypatch.setattr(
+                "comfy.comfy_api_env.args",
+                type("Args", (), {"comfy_api_base": url})(),
+            )
+
+        set_base("https://stagingapi.comfy.org")
+        assert "comfy_api_base_url" in get_server_features()
+        set_base("https://pr-7.testenvs.comfy.org")
+        assert "comfy_api_base_url" in get_server_features()
+        set_base("https://api.comfy.org")
+        assert "comfy_api_base_url" not in get_server_features()