[optimization] remove python function call for custom op (#11750)
Signed-off-by: youkaichao <youkaichao@gmail.com>
This commit is contained in:
@@ -753,7 +753,8 @@ def fused_experts_impl(hidden_states: torch.Tensor,
|
||||
use_int8_w8a16=use_int8_w8a16,
|
||||
block_shape=block_shape)
|
||||
|
||||
-ops.silu_and_mul(intermediate_cache2, intermediate_cache1.view(-1, N))
|
||||
+torch.ops._C.silu_and_mul(intermediate_cache2,
|
||||
+                          intermediate_cache1.view(-1, N))
|
||||
|
||||
invoke_fused_moe_kernel(intermediate_cache2,
|
||||
w2,
|
||||
|
||||
Reference in New Issue
Block a user