There was an error while loading. Please reload this page.
1 parent ce3a9b1 commit 2212cd6 Copy full SHA for 2212cd6
vllm/model_executor/layers/fused_moe/deep_gemm_utils.py
@@ -52,7 +52,7 @@ def compute_aligned_M(M: int, num_topk: int, local_num_experts: int,
52
@triton.jit
53
def apply_expert_map(expert_id, expert_map):
54
if expert_id != -1:
55
- expert_id = tl.load(expert_map + expert_id).to(tl.int64)
+ expert_id = tl.load(expert_map + expert_id).to(expert_id.dtype)
56
return expert_id
57
58
0 commit comments