Slightly lower Hunyuan Video memory usage by applying RoPE to q and k inline in attention().

2025-06-17 08:45:33 +08:00 · 2025-01-16 00:23:01 -05:00 · 2025-01-16 00:23:01 -05:00 · 6320d05696
commit 6320d05696
parent 25683b5b02
1 changed file with 8 additions and 1 deletion
--- a/comfy/ldm/flux/math.py
+++ b/comfy/ldm/flux/math.py
@@ -5,8 +5,15 @@ from torch import Tensor
 from comfy.ldm.modules.attention import optimized_attention
 import comfy.model_management

+
 def attention(q: Tensor, k: Tensor, v: Tensor, pe: Tensor, mask=None) -> Tensor:
-    q, k = apply_rope(q, k, pe)
+    q_shape = q.shape
+    k_shape = k.shape
+
+    q = q.float().reshape(*q.shape[:-1], -1, 1, 2)
+    k = k.float().reshape(*k.shape[:-1], -1, 1, 2)
+    q = (pe[..., 0] * q[..., 0] + pe[..., 1] * q[..., 1]).reshape(*q_shape).type_as(v)
+    k = (pe[..., 0] * k[..., 0] + pe[..., 1] * k[..., 1]).reshape(*k_shape).type_as(v)

    heads = q.shape[1]
    x = optimized_attention(q, k, v, heads, skip_reshape=True, mask=mask)