We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a71bb5a, commit 49ddf83 (Copy full SHA for 49ddf83)
mamba_ssm/modules/block.py
@@ -69,7 +69,7 @@ def forward(
69
if self.mlp is not None:
70
if not self.fused_add_norm:
71
residual = hidden_states + residual
72
- residual = self.norm2(residual.to(dtype=self.norm2.weight.dtype))
+ hidden_states = self.norm2(residual.to(dtype=self.norm2.weight.dtype))
73
if self.residual_in_fp32:
74
residual = residual.to(torch.float32)
75
else:
0 commit comments