@@ -24,12 +24,17 @@ def __init__(self, *args, **kwargs):
2424 self .padding [1 ], 2 * self .padding [0 ], 0 )
2525 self .padding = (0 , 0 , 0 )
2626
def forward(self, x, cache_x=None, cache_list=None, cache_idx=None):
    """Run the causal 3-D convolution, optionally consuming cached frames.

    Args:
        x: input tensor; concatenation below fixes dim 2 as the temporal axis.
        cache_x: frames from a previous chunk to prepend along time, or None.
        cache_list: optional mutable list of cache tensors; when given, the
            entry at ``cache_idx`` is popped (slot set to None) so its memory
            can be released as early as possible.
        cache_idx: index into ``cache_list`` (required when it is given).

    Returns:
        The padded input passed through the parent convolution's forward.
    """
    # Pull the cache entry out of the shared list in place; clearing the
    # slot drops the caller's reference, lowering peak memory.
    if cache_list is not None:
        cache_x = cache_list[cache_idx]
        cache_list[cache_idx] = None

    pad = list(self._padding)
    if cache_x is not None and self._padding[4] > 0:
        # Prepend the cached frames on the temporal axis and shrink the
        # leading temporal padding by the number of frames supplied.
        cache_x = cache_x.to(x.device)
        x = torch.cat([cache_x, x], dim=2)
        pad[4] -= cache_x.shape[2]
        # Release the cached tensor before F.pad allocates the padded copy.
        del cache_x
    x = F.pad(x, pad)

    return super().forward(x)
@@ -166,7 +171,7 @@ def __init__(self, in_dim, out_dim, dropout=0.0):
166171 if in_dim != out_dim else nn .Identity ()
167172
168173 def forward (self , x , feat_cache = None , feat_idx = [0 ]):
169- h = self . shortcut ( x )
174+ old_x = x
170175 for layer in self .residual :
171176 if isinstance (layer , CausalConv3d ) and feat_cache is not None :
172177 idx = feat_idx [0 ]
@@ -178,12 +183,12 @@ def forward(self, x, feat_cache=None, feat_idx=[0]):
178183 cache_x .device ), cache_x
179184 ],
180185 dim = 2 )
181- x = layer (x , feat_cache [ idx ] )
186+ x = layer (x , cache_list = feat_cache , cache_idx = idx )
182187 feat_cache [idx ] = cache_x
183188 feat_idx [0 ] += 1
184189 else :
185190 x = layer (x )
186- return x + h
191+ return x + self . shortcut ( old_x )
187192
188193
189194class AttentionBlock (nn .Module ):
0 commit comments