Mirror of https://github.com/lucidrains/DALLE2-pytorch.git, synced 2026-02-22 01:54:22 +01:00.
Compare commits

1 commit
| Author | SHA1 | Date |
|---|---|---|
|  | 3df86acc8b |  |
```diff
@@ -251,9 +251,7 @@ class XClipAdapter(BaseClipAdapter):
         text_mask = text != 0
         encoder_output = self.clip.text_transformer(text)
 
-        encoder_output_is_cls = encoder_output.ndim == 3
-
-        text_cls, text_encodings = (encoder_output[:, 0], encoder_output[:, 1:]) if encoder_output_is_cls else (encoder_output, None)
+        text_cls, text_encodings = (encoder_output[:, 0], encoder_output[:, 1:]) if encoder_output.ndim == 3 else (encoder_output, None)
         text_embed = self.clip.to_text_latent(text_cls)
 
         if exists(text_encodings):
```
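As an editorial aside, not part of the commit: the old and new forms implement the same unpacking. When the x-clip text transformer returns a 3-d tensor of per-token encodings, the first position is taken as the CLS embedding and the remainder as the token encodings; a 2-d output is treated as an already-pooled embedding with no token-level encodings. A minimal standalone sketch of that branch, using a random stand-in tensor in place of the real `text_transformer` output:

```python
import torch

# Hypothetical stand-in for self.clip.text_transformer(text):
# batch of 4, 9 positions (1 CLS token + 8 sequence tokens), 512 dims.
encoder_output = torch.randn(4, 9, 512)

# Same unpacking as the one-liner in the hunk above: a 3-d output is
# split into the CLS vector and the remaining per-token encodings,
# while a 2-d output is already pooled and has no token encodings.
text_cls, text_encodings = (
    (encoder_output[:, 0], encoder_output[:, 1:])
    if encoder_output.ndim == 3
    else (encoder_output, None)
)

print(text_cls.shape)        # torch.Size([4, 512])
print(text_encodings.shape)  # torch.Size([4, 8, 512])
```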
```diff
@@ -879,8 +877,6 @@ class Attention(nn.Module):
         # attention
 
         attn = sim.softmax(dim = -1, dtype = torch.float32)
-        attn = attn.type(sim.dtype)
-
         attn = self.dropout(attn)
 
         # aggregate values
```
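This hunk (and the matching CrossAttention hunk below) keeps the softmax accumulated in float32 for numerical stability but drops the cast back to the similarity tensor's dtype, so the attention weights now stay in float32. A self-contained sketch of the dtype behaviour under half precision, separate from the repository's code:

```python
import torch

# Attention logits in half precision, as under mixed-precision training.
sim = torch.randn(1, 8, 16, 16, dtype = torch.float16)

# Softmax computed and returned in float32 for numerical stability.
attn = sim.softmax(dim = -1, dtype = torch.float32)
print(attn.dtype)  # torch.float32 -- what remains after this commit

# The removed line cast the weights back to the logits' dtype.
attn_cast = attn.type(sim.dtype)
print(attn_cast.dtype)  # torch.float16 -- the behaviour being removed
```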
```diff
@@ -1639,7 +1635,6 @@ class CrossAttention(nn.Module):
             sim = sim.masked_fill(~mask, max_neg_value)
 
         attn = sim.softmax(dim = -1, dtype = torch.float32)
-        attn = attn.type(sim.dtype)
 
         out = einsum('b h i j, b h j d -> b h i d', attn, v)
         out = rearrange(out, 'b h n d -> b n (h d)')
```
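For context on the unchanged aggregation lines at the end of the hunk: the `einsum` contracts the attention weights against the values independently per head, and `rearrange` folds the heads back into the feature dimension. A self-contained sketch with arbitrarily chosen shapes:

```python
import torch
from torch import einsum
from einops import rearrange

b, h, n, d = 2, 8, 16, 64                        # batch, heads, sequence, head dim
attn = torch.randn(b, h, n, n).softmax(dim = -1) # row-normalized attention weights
v = torch.randn(b, h, n, d)                      # values

# Weighted sum of value rows j for each query position i, per head.
out = einsum('b h i j, b h j d -> b h i d', attn, v)

# Merge heads into features: (b, h, n, d) -> (b, n, h * d).
out = rearrange(out, 'b h n d -> b n (h d)')
print(out.shape)  # torch.Size([2, 16, 512])
```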
The version string moves from 1.8.4 back to 1.8.3:

```diff
@@ -1 +1 @@
-__version__ = '1.8.4'
+__version__ = '1.8.3'
```

Together with the hunks above, which strip out the `encoder_output_is_cls` intermediate and the `attn.type(sim.dtype)` casts, the downgrade suggests this commit reverts the changes that shipped in 1.8.4.