[Bugfix] Fix triton import with local TritonPlaceholder (#17446)

Signed-off-by: Mengqing Cao <cmq0113@163.com>
This commit is contained in:
Mengqing Cao
2025-05-06 17:53:09 +08:00
committed by GitHub
parent 05e1f96419
commit f9bc5a0693
30 changed files with 165 additions and 75 deletions

View File

@@ -7,8 +7,6 @@ import os
from typing import Any, Dict, List, Optional, Tuple, Union
import torch
-import triton
-import triton.language as tl
from vllm import _custom_ops as ops
from vllm.logger import init_logger
@@ -17,6 +15,7 @@ from vllm.model_executor.layers.quantization.utils.quant_utils import (
from vllm.model_executor.layers.quantization.utils.w8a8_utils import (
CUTLASS_BLOCK_FP8_SUPPORTED)
from vllm.platforms import current_platform
+from vllm.triton_utils import tl, triton
from vllm.utils import direct_register_custom_op
logger = init_logger(__name__)