Skip to content

Commit 97ed730

Browse files
committed
fix the search call
1 parent bdf7fe0 commit 97ed730

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

csrc/gpu/moe/fused_moe/cutlass_kernels/moe_gemm/fused_moe_gemm_kernels_template.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -706,7 +706,7 @@ void MoeGemmRunner<T, WeightType>::run_gemm<EpilogueTag, FineGrained>(
706 706   for (size_t ii = 0; ii < candidate_configs.size(); ++ii) {
707 707   try {
708 708   for (int i = 0; i < warm_time; i++) {
709     - dispatch_to_arch<EpilogueTag>(A,
    709 + dispatch_to_arch<EpilogueTag, FineGrained>(A,
710 710   B,
711 711   weight_scales,
712 712   biases,
@@ -727,7 +727,7 @@ void MoeGemmRunner<T, WeightType>::run_gemm<EpilogueTag, FineGrained>(
727 727   check_cuda_error(cudaStreamSynchronize(stream));
728 728   check_cuda_error(cudaEventRecord(start, stream));
729 729   for (int i = 0; i < test_time; i++) {
730     - dispatch_to_arch<EpilogueTag>(A,
    730 + dispatch_to_arch<EpilogueTag, FineGrained>(A,
731 731   B,
732 732   weight_scales,
733 733   biases,

0 commit comments

Comments
 (0)