It makes more sense to keep `norm_out = True` as the default, for stability

This commit is contained in:
Phil Wang
2022-05-02 10:50:55 -07:00
parent 2d25c89f35
commit 11469dc0c6
2 changed files with 2 additions and 2 deletions

View File

@@ -599,7 +599,7 @@ class CausalTransformer(nn.Module):
dim_head = 64,
heads = 8,
ff_mult = 4,
- norm_out = False,
+ norm_out = True,
attn_dropout = 0.,
ff_dropout = 0.,
final_proj = True