Skip to content

Commit 1806d1a

Browse files
authored
[ROCm] [DSv4] [Perf] Support DeepSeek v4 MTP (vllm-project#43385)
Signed-off-by: tjtanaa <tunjian.tan@embeddedllm.com>
1 parent 5940590 commit 1806d1a

6 files changed

Lines changed: 2340 additions & 52 deletions

File tree

vllm/model_executor/layers/fused_moe/experts/gpt_oss_triton_kernels_moe.py

Lines changed: 22 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -81,17 +81,28 @@ def _patch_make_bitmatrix_metadata() -> None:
     import triton.language as tl
 
     try:
-        from vllm.third_party.triton_kernels.tensor_details import (
-            bitmatrix as _bm,
-        )
-        from vllm.third_party.triton_kernels.tensor_details.bitmatrix import (
-            BitmatrixMetadata,
-            _keyed_add,
-            cdiv,
-        )
-        from vllm.third_party.triton_kernels.tensor_details.bitmatrix_details.sum_bitmatrix_rows import ( # noqa: E501
-            sum_bitmatrix_rows,
-        )
+        if current_platform.is_rocm():
+            from triton_kernels.tensor_details import bitmatrix as _bm
+            from triton_kernels.tensor_details.bitmatrix import (
+                BitmatrixMetadata,
+                _keyed_add,
+                cdiv,
+            )
+            from triton_kernels.tensor_details.bitmatrix_details.sum_bitmatrix_rows import ( # noqa: E501
+                sum_bitmatrix_rows,
+            )
+        else:
+            from vllm.third_party.triton_kernels.tensor_details import (
+                bitmatrix as _bm,
+            )
+            from vllm.third_party.triton_kernels.tensor_details.bitmatrix import (
+                BitmatrixMetadata,
+                _keyed_add,
+                cdiv,
+            )
+            from vllm.third_party.triton_kernels.tensor_details.bitmatrix_details.sum_bitmatrix_rows import ( # noqa: E501
+                sum_bitmatrix_rows,
+            )
     except ImportError:
         return

vllm/models/deepseek_v4/amd/model.py

Lines changed: 0 additions & 1 deletion
This file was deleted.

0 commit comments

Comments
 (0)