Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
64 commits
Select commit Hold shift + click to select a range
e0e3653
add universal noise and optional denoiser noise inputs
JPPhoto Apr 11, 2026
3de1a0b
Document scheduler parity limitations
JPPhoto Apr 11, 2026
1a4c1a8
Clarify external noise integration rules
JPPhoto Apr 11, 2026
eb4a0d9
chore: typegen
JPPhoto Apr 14, 2026
dbb7acb
Merge branch 'main' into universal-noise-and-denoiser-inputs
JPPhoto Apr 14, 2026
5847815
Merge branch 'main' into universal-noise-and-denoiser-inputs
JPPhoto Apr 14, 2026
4eda4ea
Merge branch 'main' into universal-noise-and-denoiser-inputs
JPPhoto Apr 14, 2026
eace497
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 14, 2026
7bea25f
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 17, 2026
a4e7326
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 17, 2026
ccd22ad
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 18, 2026
b697db8
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 18, 2026
eb41fb4
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 19, 2026
7456190
Merge branch 'main' into universal-noise-and-denoiser-inputs
Pfannkuchensack Apr 19, 2026
78b414e
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 19, 2026
1c1cd81
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 20, 2026
8799a78
Fix external noise handling regressions
JPPhoto Apr 20, 2026
5106cd9
Merge remote-tracking branch 'origin/main' into universal-noise-and-d…
JPPhoto Apr 20, 2026
d6411d4
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 20, 2026
fd7c929
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 20, 2026
125e207
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 20, 2026
d8aa3b0
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 21, 2026
a36bf12
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 21, 2026
7339710
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 21, 2026
69cbd14
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 22, 2026
700550f
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 23, 2026
0df8078
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 25, 2026
61c3c24
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 25, 2026
9c35c93
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
3d1c477
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
e58c6a3
Merge remote-tracking branch 'origin/main' into universal-noise-and-d…
JPPhoto Apr 27, 2026
1bec337
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
e5dcc2f
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
569a260
chore: typegen
JPPhoto Apr 27, 2026
02649b3
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
7969c52
Fix stale FLUX.2 scheduler mu test
JPPhoto Apr 27, 2026
c6a059b
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
f1254d7
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
8630b2c
chore: typegen
JPPhoto Apr 27, 2026
35d8371
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 27, 2026
52453e6
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto Apr 30, 2026
4aa41cf
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 1, 2026
c58021a
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 5, 2026
58c72cf
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 6, 2026
6ce5053
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 6, 2026
7fbf14a
chore: typegen
JPPhoto May 6, 2026
d434ca3
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 7, 2026
51b260e
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 7, 2026
5224954
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 7, 2026
cbc150c
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 7, 2026
1e3c92c
chore: typegen
JPPhoto May 7, 2026
250e037
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 8, 2026
40171aa
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 8, 2026
ccf9ad5
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 8, 2026
033df87
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 8, 2026
05e0f11
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 8, 2026
69dc383
Merge remote-tracking branch 'origin/main' into universal-noise-and-d…
JPPhoto May 8, 2026
033ca05
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 9, 2026
88c6597
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 9, 2026
c51e6b6
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 11, 2026
034d282
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 11, 2026
0964155
Fold universal noise into noise node
JPPhoto May 11, 2026
ec6a8f3
Address PR review cleanup comments
JPPhoto May 11, 2026
3e272c8
Merge remote-tracking branch 'origin/main' into codex-tmp/update-bran…
JPPhoto May 11, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
85 changes: 77 additions & 8 deletions docs-old/contributing/NEW_MODEL_INTEGRATION.md
Original file line number Diff line number Diff line change
Expand Up @@ -442,6 +442,7 @@ class NewModelTextEncoderInvocation(BaseInvocation):
class NewModelDenoiseInvocation(BaseInvocation):
# Standard Fields
latents: LatentsField | None = InputField(default=None)
noise: LatentsField | None = InputField(default=None)
positive_conditioning: ConditioningField = InputField()
negative_conditioning: ConditioningField | None = InputField(default=None)

Expand All @@ -453,6 +454,7 @@ class NewModelDenoiseInvocation(BaseInvocation):
denoising_end: float = InputField(default=1.0, ge=0, le=1)
steps: int = InputField(default=20, ge=1)
cfg_scale: float = InputField(default=7.0)
add_noise: bool = InputField(default=True)

# Image-to-Image / Inpainting
denoise_mask: DenoiseMaskField | None = InputField(default=None)
Expand All @@ -461,16 +463,27 @@ class NewModelDenoiseInvocation(BaseInvocation):
scheduler: Literal["euler", "heun", "lcm"] = InputField(default="euler")

def invoke(self, context: InvocationContext) -> LatentsOutput:
# 1. Generate noise
noise = get_noise_newmodel(seed, height, width, ...)

# 2. Pack latents (if needed)
x = pack_newmodel(latents)
# 1. Load or generate noise
if self.noise is not None:
noise = self._load_and_validate_noise(context)
else:
noise = get_noise_newmodel(seed, height, width, ...)

# 3. Compute schedule
# 2. Compute schedule
timesteps = get_schedule_newmodel(num_steps, denoising_start, denoising_end)

# 4. Denoising loop
# 3. Prepare init latents and img2img preblend
if latents is not None and self.add_noise:
x = noise * timesteps[0] + latents * (1.0 - timesteps[0])
elif latents is not None:
x = latents
else:
x = noise

# 4. Pack latents (if needed)
x = pack_newmodel(x)

# 5. Denoising loop
x = denoise(
model=transformer,
x=x,
Expand All @@ -480,12 +493,19 @@ class NewModelDenoiseInvocation(BaseInvocation):
inpaint_extension=inpaint_extension, # For inpainting
)

# 5. Unpack latents
# 6. Unpack latents
latents = unpack_newmodel(x)

return LatentsOutput(latents=latents)
```

If the architecture supports external noise, the denoise invocation should
accept an optional `noise: LatentsField` input and preserve the existing
seed-driven path when it is not connected. Validate external noise against
the architecture's expected rank, channel count, and spatial shape before
using it. Existing workflows must continue to work unchanged when `noise` is
left disconnected.

### 4.4 VAE Encode Invocation

**File:** `invokeai/app/invocations/[newmodel]_vae_encode.py`
Expand Down Expand Up @@ -536,6 +556,9 @@ class NewModelVaeDecodeInvocation(BaseInvocation):
- [ ] Model loader invocation (`[newmodel]_model_loader.py`)
- [ ] Text encoder invocation (`[newmodel]_text_encoder.py`)
- [ ] Denoise invocation (`[newmodel]_denoise.py`)
- [ ] Add optional `noise: LatentsField` when the architecture supports
external noise
- [ ] Preserve the seed-driven fallback path when `noise` is not connected
- [ ] VAE encode invocation (`[newmodel]_vae_encode.py`)
- [ ] VAE decode invocation (`[newmodel]_vae_decode.py`)
- [ ] Define output classes (e.g., `NewModelLoaderOutput`)
Expand Down Expand Up @@ -574,6 +597,11 @@ def get_noise_newmodel(
dtype=dtype,
)

# If the architecture supports external noise, extend the standard
# invokeai/app/invocations/noise.py node when the tensor contract can be
# represented there. Only create a dedicated noise invocation when the
# standard noise node cannot express the architecture cleanly.

def pack_newmodel(x: torch.Tensor) -> torch.Tensor:
"""Pack latents for transformer input.

Expand Down Expand Up @@ -670,6 +698,13 @@ def denoise(
return img
```

If the architecture supports external noise, the denoise path should accept
validated external noise without changing the legacy seed-driven behavior.
Review img2img and inpaint preblend logic carefully when adding scheduler
support. If the initial latent/noise mix is computed before
`scheduler.set_timesteps()`, confirm that the preblend matches the
scheduler's true first effective sigma or timestep.

### 5.3 Scheduler (if model-specific)

**File:** `invokeai/backend/[newmodel]/schedulers.py` or use existing
Expand All @@ -690,11 +725,16 @@ NEWMODEL_SCHEDULER_MAP = {
### Backend Sampling and Denoise Checklist

- [ ] Noise generation (`get_noise_newmodel()`)
- [ ] Extend `invokeai/app/invocations/noise.py` when the architecture's
noise tensor contract fits the standard architecture selector
- [ ] Pack/unpack functions (if transformer-based)
- [ ] Schedule generation (`get_schedule_newmodel()`)
- [ ] Position ID generation (if needed)
- [ ] Implement denoise loop
- [ ] Validate external noise shape and rank if the architecture supports it
- [ ] Scheduler integration
- [ ] Verify img2img and inpaint preblend parity with the scheduler's first
effective timestep or sigma
- [ ] Inpaint extension integration
- [ ] Progress callbacks

Expand Down Expand Up @@ -847,6 +887,11 @@ if (
}
```

If the architecture supports external noise, do not require generated
workflows to connect it. Keep the denoise node backward compatible by
leaving `noise` disconnected unless the workflow explicitly needs external
noise.

### Frontend Graph Building Checklist

- [ ] Create graph builder (`buildNewModelGraph.ts`)
Expand Down Expand Up @@ -1209,6 +1254,25 @@ export const NewModelSchedulerSelect = () => {
- [ ] Frontend UI component
- [ ] State management

**External Noise:**
- [ ] Add optional `noise: LatentsField` input to the denoise invocation
- [ ] Validate external noise shape against the architecture's expected
latent shape
- [ ] Preserve existing behavior when `noise` is not connected
- [ ] Extend the standard `noise` invocation when the architecture's latent
noise contract can be represented there
- [ ] Add a dedicated architecture-compatible noise invocation only when
the standard `noise` invocation cannot support the architecture cleanly

If your model supports external noise, the denoise invocation should accept
it as an optional input rather than replacing the existing seed-driven path.
When possible, wire the architecture into the standard `noise` invocation's
architecture selector instead of creating a separate noise node. Only create
a dedicated noise invocation if the architecture has a noise tensor contract
that the standard `noise` invocation cannot express cleanly. When external
noise is connected, validate rank, channel count, and spatial shape before
blending it with init latents or using it as the initial latent state.

---

## Summary: Minimal Integration
Expand Down Expand Up @@ -1240,6 +1304,11 @@ For a **minimal txt2img integration**, the following files are required:
3. `src/features/nodes/util/graph/generation/addInpaint.ts`
4. `src/features/nodes/util/graph/generation/addOutpaint.ts`

If the architecture supports external noise, also extend
`invokeai/app/invocations/noise.py` when possible and keep the denoise
invocation's `noise` input optional so existing generated workflows continue
to work without modification.

---

## Reference: Existing Implementations
Expand Down
7 changes: 5 additions & 2 deletions docs-old/nodes/NODES.md
Original file line number Diff line number Diff line change
Expand Up @@ -43,7 +43,11 @@ There are several node grouping concepts that can be examined with a narrow focu

### Create Latent Noise

An initial noise tensor is necessary for the latent diffusion process. As a result, the Denoising node requires a noise node input.
An initial noise tensor is necessary for the latent diffusion process. As a result, the Denoising node requires a noise node input.

The standard Create Latent Noise node includes a Noise Type selector for architecture-specific latent shapes. Leave it
at SD for classic 4-channel Stable Diffusion workflows, or switch it to match the downstream denoiser when using
architectures like FLUX, FLUX.2, SD3, CogView4, Z-Image, or Anima.

![groupsnoise](../assets/nodes/groupsnoise.png)

Expand Down Expand Up @@ -94,4 +98,3 @@ Iteration is a common concept in any processing, and means to repeat a process w
Batch or multiple image generation in the workflow editor is done using the RandomRange node. In this case, the 'Size' field represents the number of images to generate, meaning this example will generate 4 images. As RandomRange produces a collection of integers, we need to add the Iterate node to iterate through the collection. This noise can then be fed to the Denoise Latents node for it to iterate through the denoising process with the different seeds provided.

![groupsmultigenseeding](../assets/nodes/groupsmultigenseeding.png)

12 changes: 12 additions & 0 deletions docs/src/content/docs/development/Guides/models.mdx
Original file line number Diff line number Diff line change
Expand Up @@ -224,6 +224,12 @@ This is where the actual mathematical implementation of the model lives.
return rearrange(x, "b c (h ph) (w pw) -> b (h w) (c ph pw)", ph=2, pw=2)
```

If the architecture supports external noise, prefer extending the standard
`invokeai/app/invocations/noise.py` node's `noise_type` selector instead of
adding a brand new noise node. Only add a dedicated noise invocation when the
architecture's noise tensor rank or layout cannot be expressed by the
standard node.

2. **The Denoising Loop**

Implement the core sampling loop. This interacts with schedulers and handles classifier-free guidance (CFG).
Expand Down Expand Up @@ -311,6 +317,7 @@ Invocations expose your PyTorch functions as isolated execution nodes in InvokeA
@invocation("newmodel_denoise", title="NewModel Denoise", category="latents")
class NewModelDenoiseInvocation(BaseInvocation):
latents: LatentsField | None = InputField(default=None)
noise: LatentsField | None = InputField(default=None)
positive_conditioning: ConditioningField = InputField()
transformer: TransformerField = InputField()
steps: int = InputField(default=20)
Expand All @@ -321,6 +328,10 @@ Invocations expose your PyTorch functions as isolated execution nodes in InvokeA
pass
```

If you add external noise support, keep it optional so seed-driven workflows
continue to work. Validate connected noise against the architecture's
expected shape before using it.

4. **VAE Encode / Decode Invocations**

Create nodes to transition between pixel space (images) and latent space.
Expand All @@ -331,6 +342,7 @@ Invocations expose your PyTorch functions as isolated execution nodes in InvokeA
- [ ] Model loader invocation (`[newmodel]_model_loader.py`)
- [ ] Text encoder invocation (`[newmodel]_text_encoder.py`)
- [ ] Denoise invocation (`[newmodel]_denoise.py`)
- [ ] Extend the standard `noise` invocation if the architecture supports external noise
- [ ] VAE encode/decode invocations (`[newmodel]_vae_encode.py`, `[newmodel]_vae_decode.py`)
:::

Expand Down
4 changes: 4 additions & 0 deletions docs/src/content/docs/workflows/editor-interface.mdx
Original file line number Diff line number Diff line change
Expand Up @@ -73,6 +73,10 @@ The screenshots below aren't examples of complete functioning node graphs, but r
### Create Latent Noise
An initial noise tensor is necessary for the latent diffusion process. As a result, the Denoising node requires a noise node input.

The standard **Create Latent Noise** node now includes a **Noise Type** selector for architecture-specific latent
shapes. Leave it at **SD** for classic 4-channel Stable Diffusion workflows, or switch it to the architecture that
matches the downstream denoiser when working with models like FLUX, FLUX.2, SD3, CogView4, Z-Image, or Anima.

![Create Latent Noise](./assets/groupsnoise.png)

### Text Prompt Conditioning
Expand Down
37 changes: 34 additions & 3 deletions invokeai/app/invocations/anima_denoise.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,6 +34,7 @@
InputField,
LatentsField,
)
from invokeai.app.invocations.latent_noise import validate_noise_tensor_shape
from invokeai.app.invocations.model import TransformerField
from invokeai.app.invocations.primitives import LatentsOutput
from invokeai.app.services.shared.invocation_context import InvocationContext
Expand Down Expand Up @@ -166,7 +167,7 @@ def merge_intermediate_latents_with_init_latents(
title="Denoise - Anima",
tags=["image", "anima"],
category="image",
version="1.5.0",
version="1.6.0",
classification=Classification.Prototype,
)
class AnimaDenoiseInvocation(BaseInvocation):
Expand All @@ -182,6 +183,9 @@ class AnimaDenoiseInvocation(BaseInvocation):
latents: Optional[LatentsField] = InputField(
default=None, description=FieldDescriptions.latents, input=Input.Connection
)
noise: Optional[LatentsField] = InputField(
default=None, description=FieldDescriptions.noise, input=Input.Connection
)
# denoise_mask is used for inpainting. Only the masked region is modified.
denoise_mask: Optional[DenoiseMaskField] = InputField(
default=None, description=FieldDescriptions.denoise_mask, input=Input.Connection
Expand Down Expand Up @@ -459,19 +463,35 @@ def _run_diffusion(self, context: InvocationContext) -> torch.Tensor:
if init_latents.ndim == 4:
init_latents = init_latents.unsqueeze(2) # [B, C, H, W] -> [B, C, 1, H, W]

# Generate initial noise (3D latent: [B, C, T, H, W])
noise = self._get_noise(self.height, self.width, inference_dtype, device, self.seed)
# Generate initial noise (3D latent: [B, C, T, H, W]).
# If noise will never be consumed, avoid validating/loading it.
should_ignore_noise = init_latents is not None and not self.add_noise and self.denoise_mask is None
noise: torch.Tensor | None
if should_ignore_noise:
noise = None
else:
noise = self._prepare_noise_tensor(context, inference_dtype, device)

# Prepare input latents
if init_latents is not None:
if self.add_noise:
assert noise is not None
# Noise the init latents using the first sigma from the clipped
# InvokeAI schedule.
#
# Known limitation: if the selected scheduler later starts from a
# different first effective sigma/timestep than sigmas[0], the
# img2img preblend below may not match that scheduler exactly.
# This is an existing pipeline limitation and affects both
# internally generated noise and externally supplied noise.
s_0 = sigmas[0]
latents = s_0 * noise + (1.0 - s_0) * init_latents
else:
latents = init_latents
else:
if self.denoising_start > 1e-5:
raise ValueError("denoising_start should be 0 when initial latents are not provided.")
assert noise is not None
latents = noise

if total_steps <= 0:
Expand All @@ -483,6 +503,7 @@ def _run_diffusion(self, context: InvocationContext) -> torch.Tensor:
if inpaint_mask is not None:
if init_latents is None:
raise ValueError("Initial latents are required when using an inpaint mask (image-to-image inpainting)")
assert noise is not None
inpaint_extension = AnimaInpaintExtension(
init_latents=init_latents.squeeze(2),
inpaint_mask=inpaint_mask,
Expand Down Expand Up @@ -669,6 +690,16 @@ def _run_transformer(ctx: torch.Tensor, x: torch.Tensor, t: torch.Tensor) -> tor
# Remove temporal dimension for output: [B, C, 1, H, W] -> [B, C, H, W]
return latents.squeeze(2)

def _prepare_noise_tensor(
    self, context: InvocationContext, inference_dtype: torch.dtype, device: torch.device
) -> torch.Tensor:
    """Return the initial noise tensor for denoising.

    When an external ``noise`` latents field is connected, load it, move it to
    the target device/dtype, and validate its shape against the Anima latent
    contract before returning it. Otherwise fall back to the legacy
    seed-driven noise generator so existing workflows are unaffected.
    """
    if self.noise is None:
        # No external noise connected: preserve the seed-driven path.
        return self._get_noise(self.height, self.width, inference_dtype, device, self.seed)

    external = context.tensors.load(self.noise.latents_name)
    external = external.to(device=device, dtype=inference_dtype)
    # Reject tensors whose rank/channels/spatial dims don't match Anima's
    # expected latent shape before they reach the denoise loop.
    validate_noise_tensor_shape(external, "Anima", self.width, self.height)
    return external

def _build_step_callback(self, context: InvocationContext) -> Callable[[PipelineIntermediateState], None]:
def step_callback(state: PipelineIntermediateState) -> None:
context.util.sd_step_callback(state, BaseModelType.Anima)
Expand Down
Loading
Loading