@@ -8,7 +8,7 @@
 from comfy.ldm.lightricks.model import TimestepEmbedding, Timesteps
 from comfy.ldm.modules.attention import optimized_attention_masked
 from comfy.ldm.flux.layers import EmbedND
-
+import comfy.ldm.common_dit
 
 class GELU(nn.Module):
     def __init__(self, dim_in: int, dim_out: int, approximate: str = "none", bias: bool = True, dtype=None, device=None, operations=None):
@@ -364,8 +364,9 @@ def forward(
 
         image_rotary_emb = self.pos_embeds(x, context)
 
-        orig_shape = x.shape
-        hidden_states = x.view(orig_shape[0], orig_shape[1], orig_shape[-2] // 2, 2, orig_shape[-1] // 2, 2)
+        hidden_states = comfy.ldm.common_dit.pad_to_patch_size(x, (1, self.patch_size, self.patch_size))
+        orig_shape = hidden_states.shape
+        hidden_states = hidden_states.view(orig_shape[0], orig_shape[1], orig_shape[-2] // 2, 2, orig_shape[-1] // 2, 2)
         hidden_states = hidden_states.permute(0, 2, 4, 1, 3, 5)
         hidden_states = hidden_states.reshape(orig_shape[0], (orig_shape[-2] // 2) * (orig_shape[-1] // 2), orig_shape[1] * 4)
 
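The patchify step in this hunk (view, permute, reshape) carves the latent into patch_size x patch_size blocks, which silently requires the height and width to be even multiples of the patch size; padding first lifts that restriction, and the padded rows and columns are cropped away again at the end of forward. Below is a minimal sketch of the padding idea, using a hypothetical pad_to_multiple helper as a stand-in (the real comfy.ldm.common_dit.pad_to_patch_size may differ in signature and padding mode):

import torch
import torch.nn.functional as F

def pad_to_multiple(x, patch_size):
    # Hypothetical stand-in for comfy.ldm.common_dit.pad_to_patch_size:
    # right/bottom-pads each trailing dim of x up to the next multiple of
    # the matching entry in patch_size, e.g. (1, 2, 2) for (C, H, W).
    pad = []
    for i, p in enumerate(reversed(patch_size)):
        dim = x.shape[-1 - i]
        pad.extend([0, (p - dim % p) % p])  # (left, right) per dim, last dim first
    return F.pad(x, pad)

x = torch.randn(1, 16, 33, 47)   # odd H and W: x.view(..., H // 2, 2, ...) would fail
h = pad_to_multiple(x, (1, 2, 2))
print(h.shape)                   # torch.Size([1, 16, 34, 48]) -- divisible by the patch size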
@@ -396,4 +397,4 @@ def forward(
 
         hidden_states = hidden_states.view(orig_shape[0], orig_shape[-2] // 2, orig_shape[-1] // 2, orig_shape[1], 2, 2)
         hidden_states = hidden_states.permute(0, 3, 1, 4, 2, 5)
-        return hidden_states.reshape(orig_shape)
+        return hidden_states.reshape(orig_shape)[:, :, :, :x.shape[-2], :x.shape[-1]]
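Because the model now runs on the padded tensor, the un-patchified output has the padded height and width; the new slice crops it back to the caller's original x.shape[-2] and x.shape[-1]. A round-trip sketch of that pad-then-crop contract, reusing the hypothetical pad_to_multiple from above:

x = torch.randn(1, 16, 33, 47)
h = pad_to_multiple(x, (1, 2, 2))            # (1, 16, 34, 48)
out = h                                      # stand-in for the un-patchified model output
out = out[..., :x.shape[-2], :x.shape[-1]]   # drop the padded rows/columns
assert out.shape == x.shape                  # back to (1, 16, 33, 47)

The ellipsis keeps the sketch layout-agnostic; the commit instead slices each leading dimension explicitly to match the model's latent layout.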