We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9dfd075 commit eb7cb34 Copy full SHA for eb7cb34
vllm_ascend/models/glm4_moe.py
@@ -76,7 +76,7 @@ def forward(self, hidden_states: torch.Tensor) -> torch.Tensor:
76
final_hidden_states = (
77
self.experts.maybe_all_reduce_tensor_model_parallel(
78
final_hidden_states))
79
- return final_hidden_states.view(num_tokens, hidden_dim)
+ return final_hidden_states.view(-1, hidden_dim)
80
81
82
class CustomGlm4MoeDecoderLayer(nn.Module):
0 commit comments