commit ca22cdc697
Author: Dr. Christoph Mittendorf
Date:   2024-03-21 20:47:38 +02:00
Committed by: GitHub


@@ -1,6 +1,4 @@
 # modified from https://github.com/mlfoundations/open_flamingo/blob/main/open_flamingo/src/helpers.py
-import math
-
 import torch
 import torch.nn as nn
@@ -65,7 +63,7 @@ class PerceiverAttention(nn.Module):
         v = reshape_tensor(v, self.heads)
 
         # attention
-        scale = 1 / math.sqrt(math.sqrt(self.dim_head))
+        scale = 1 / (self.dim_head ** 0.5)
         weight = (q * scale) @ (k * scale).transpose(-2, -1)  # More stable with f16 than dividing afterwards
         weight = torch.softmax(weight.float(), dim=-1).type(weight.dtype)
         out = weight @ v
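
For context, here is a minimal standalone sketch (not part of this commit; shapes and values are arbitrary) showing the overall factor each scaling expression produces when, as in the line changed above, it is applied to both q and k before the matmul: a per-side factor s scales q @ k^T by s**2.

```python
# Standalone sketch with assumed tensor shapes (batch, heads, tokens, dim_head).
# The old expression, 1 / math.sqrt(math.sqrt(dim_head)), applied to both q and k,
# yields an overall 1/sqrt(dim_head) on q @ k^T; 1 / dim_head**0.5 applied to both
# sides yields 1/dim_head overall.
import math

import torch

dim_head = 64
q = torch.randn(1, 8, 4, dim_head)
k = torch.randn(1, 8, 4, dim_head)

old_scale = 1 / math.sqrt(math.sqrt(dim_head))  # dim_head ** -0.25 per side
new_scale = 1 / (dim_head ** 0.5)               # dim_head ** -0.5 per side

w_old = (q * old_scale) @ (k * old_scale).transpose(-2, -1)  # q @ k^T / sqrt(dim_head)
w_new = (q * new_scale) @ (k * new_scale).transpose(-2, -1)  # q @ k^T / dim_head

print(torch.allclose(w_old, q @ k.transpose(-2, -1) / dim_head ** 0.5, atol=1e-5))  # True
print(torch.allclose(w_new, q @ k.transpose(-2, -1) / dim_head, atol=1e-5))         # True
```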