[Misc] Add indirection layer for custom ops (#3913)

This commit is contained in:
Kunshang Ji
2024-04-11 03:26:07 +00:00
committed by GitHub
parent e42df7227d
commit e9da5a40c6
14 changed files with 224 additions and 32 deletions

View File

@@ -6,7 +6,7 @@ import torch
import torch.nn as nn
import torch.nn.functional as F
-from vllm._C import ops
+from vllm import _custom_ops as ops
from vllm.distributed import (divide, get_tensor_model_parallel_rank,
                              get_tensor_model_parallel_world_size)
from vllm.model_executor.layers.quantization import QuantizationConfig