We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 59be631 + 49ddf83 commit 3bc4a51 Copy full SHA for 3bc4a51
mamba_ssm/modules/block.py
@@ -69,7 +69,7 @@ def forward(
69
if self.mlp is not None:
70
if not self.fused_add_norm:
71
residual = hidden_states + residual
72
- residual = self.norm2(residual.to(dtype=self.norm2.weight.dtype))
+ hidden_states = self.norm2(residual.to(dtype=self.norm2.weight.dtype))
73
if self.residual_in_fp32:
74
residual = residual.to(torch.float32)
75
else:
0 commit comments