File tree Expand file tree Collapse file tree 1 file changed +8
-0
lines changed
Expand file tree Collapse file tree 1 file changed +8
-0
lines changed Original file line number Diff line number Diff line change 11import nodes
22import node_helpers
33import torch
4+ import comfy
5+ import comfy .latent_formats
46import comfy .model_management
57import comfy .utils
68from comfy_api .latest import io , ComfyExtension
@@ -144,6 +146,12 @@ def _match_temporal(lat, target_t):
144146
145147 inpaint_latents = torch .cat ([mask_latents , masked_video_latents ], dim = 1 )
146148
149+ # CogVideoX.concat_cond() applies process_latent_in (multiplying by scale_factor)
150+ # to concat_latent_image before feeding it to the transformer. Pre-divide by
151+ # scale_factor here so the net scaling is identity — the VOID model expects raw VAE latents.
152+ scale_factor = comfy .latent_formats .CogVideoX ().scale_factor
153+ inpaint_latents = inpaint_latents / scale_factor
154+
147155 positive = node_helpers .conditioning_set_values (
148156 positive , {"concat_latent_image" : inpaint_latents }
149157 )
You can’t perform that action at this time.
0 commit comments