Skip to content

Commit f4cac8d

Browse files
committed
make buffer optional
1 parent 25db7c9 commit f4cac8d

File tree

1 file changed

+7
-2
lines changed

1 file changed

+7
-2
lines changed

vllm/_custom_ops.py

Lines changed: 7 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -918,8 +918,13 @@ def moe_align_block_size(topk_ids: torch.Tensor, num_experts: int,
918 918
block_size: int, sorted_token_ids: torch.Tensor,
919 919
experts_ids: torch.Tensor,
920 920
num_tokens_post_pad: torch.Tensor,
921-
token_cnts_buffer: torch.Tensor,
922-
cumsum_buffer: torch.Tensor) -> None:
921+
token_cnts_buffer: Optional[torch.Tensor] = None,
922+
cumsum_buffer: Optional[torch.Tensor] = None,
923+
) -> None:
924+
if token_cnts_buffer is None:
925+
token_cnts_buffer = torch.empty((0,), device=topk_ids.device)
926+
if cumsum_buffer is None:
927+
cumsum_buffer = torch.empty((0,), device=topk_ids.device)
923 928
torch.ops._moe_C.moe_align_block_size(topk_ids, num_experts, block_size,
924 929
sorted_token_ids, experts_ids,
925 930
num_tokens_post_pad,

0 commit comments

Comments
 (0)