* Force cast to fp32 to avoid attention layer overflow

This commit is contained in:
Dango233 2022-12-07 19:56:39 +08:00
parent d7440ac160
commit 6e92cda76d

View file

@ -167,7 +167,11 @@ class CrossAttention(nn.Module):
q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> (b h) n d', h=h), (q, k, v))
# force cast to fp32 to avoid overflowing
with torch.autocast(enabled=False, device_type = 'cuda'):
q, k = q.float(), k.float()
    sim = einsum('b i d, b j d -> b i j', q, k) * self.scale
del q, k
if exists(mask):