[Perf] Add Triton config for DeepSeek V3 FP8 EP32 H200 (#23504)

Signed-off-by: Ming Yang <minos.future@gmail.com>
This commit is contained in:
Ming Yang
2025-08-24 18:06:35 -07:00
committed by GitHub
parent 47455c424f
commit 504d914314
4 changed files with 184 additions and 1 deletion

View File

@@ -11,8 +11,8 @@ from datetime import datetime
from typing import Any
import torch
import tqdm
import triton
from tqdm import tqdm
from vllm.model_executor.layers.quantization.utils.fp8_utils import (
_w8a8_block_fp8_matmul,