diff --git a/csrc/cpu/sgl-kernels/gemm.cpp b/csrc/cpu/sgl-kernels/gemm.cpp index c122d0718..65c56943c 100644 --- a/csrc/cpu/sgl-kernels/gemm.cpp +++ b/csrc/cpu/sgl-kernels/gemm.cpp @@ -265,7 +265,7 @@ void tinygemm_kernel( // mb_size = 4 case 0x42: LAUNCH_TINYGEMM_KERNEL_NN(4, 32); break; case 0x44: LAUNCH_TINYGEMM_KERNEL_NN(4, 64); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } diff --git a/csrc/cpu/sgl-kernels/gemm_fp8.cpp b/csrc/cpu/sgl-kernels/gemm_fp8.cpp index b5f2f07ba..ef29181ce 100644 --- a/csrc/cpu/sgl-kernels/gemm_fp8.cpp +++ b/csrc/cpu/sgl-kernels/gemm_fp8.cpp @@ -324,7 +324,7 @@ void tinygemm_kernel( case 0x22: LAUNCH_TINYGEMM_KERNEL_NN(2, 32); break; case 0x32: LAUNCH_TINYGEMM_KERNEL_NN(3, 32); break; case 0x42: LAUNCH_TINYGEMM_KERNEL_NN(4, 32); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } diff --git a/csrc/cpu/sgl-kernels/gemm_int8.cpp b/csrc/cpu/sgl-kernels/gemm_int8.cpp index 9a5ca0642..4d6560cce 100644 --- a/csrc/cpu/sgl-kernels/gemm_int8.cpp +++ b/csrc/cpu/sgl-kernels/gemm_int8.cpp @@ -180,7 +180,7 @@ void tinygemm_kernel( // mb_size = 4 case 0x42: LAUNCH_TINYGEMM_KERNEL_NN(4, 32); break; case 0x44: LAUNCH_TINYGEMM_KERNEL_NN(4, 64); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } diff --git a/csrc/cpu/sgl-kernels/moe.cpp b/csrc/cpu/sgl-kernels/moe.cpp index 94b24c2f1..c01bfd376 100644 --- a/csrc/cpu/sgl-kernels/moe.cpp +++ b/csrc/cpu/sgl-kernels/moe.cpp @@ -398,7 +398,7 @@ void tinygemm_kernel( case 0x32: LAUNCH_TINYGEMM_KERNEL_NN(3, 32); break; // mb_size = 4 case 0x42: LAUNCH_TINYGEMM_KERNEL_NN(4, 32); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } @@ -511,7 +511,7 @@ void tinygemm_kernel( case 0x32: LAUNCH_TINYGEMM_KERNEL_NN2(3, 32); break; // mb_size = 4 case 0x42: LAUNCH_TINYGEMM_KERNEL_NN2(4, 32); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } diff --git a/csrc/cpu/sgl-kernels/moe_int8.cpp b/csrc/cpu/sgl-kernels/moe_int8.cpp index 89d0fb5d9..e28b4fc4e 100644 --- a/csrc/cpu/sgl-kernels/moe_int8.cpp +++ b/csrc/cpu/sgl-kernels/moe_int8.cpp @@ -271,7 +271,7 @@ void tinygemm_kernel( case 0x22: LAUNCH_TINYGEMM_KERNEL_VNNI(2, 32); break; case 0x32: LAUNCH_TINYGEMM_KERNEL_VNNI(3, 32); break; case 0x42: LAUNCH_TINYGEMM_KERNEL_VNNI(4, 32); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } @@ -401,7 +401,7 @@ void tinygemm_kernel( case 0x22: LAUNCH_TINYGEMM_KERNEL_VNNI2(2, 32); break; case 0x32: LAUNCH_TINYGEMM_KERNEL_VNNI2(3, 32); break; case 0x42: LAUNCH_TINYGEMM_KERNEL_VNNI2(4, 32); break; - default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", "nb_size"); + default: TORCH_CHECK(false, "Unexpected block size, ", mb_size, "x", nb_size); } } } diff --git a/csrc/moe/marlin_moe_wna16/ops.cu b/csrc/moe/marlin_moe_wna16/ops.cu index 6f229a4df..e3f3b4175 100644 --- a/csrc/moe/marlin_moe_wna16/ops.cu +++ b/csrc/moe/marlin_moe_wna16/ops.cu @@ -770,7 +770,7 @@ torch::Tensor moe_wna16_marlin_gemm( b_bias = b_bias_or_none.value(); TORCH_CHECK(b_bias.device().is_cuda(), "b_bias is not on GPU"); TORCH_CHECK(b_bias.is_contiguous(), "b_bias is not contiguous"); - TORCH_CHECK(b_bias.size(1) == size_n, "b_bias.size(0) != size_n"); + TORCH_CHECK(b_bias.size(1) == size_n, "b_bias.size(1) != size_n"); TORCH_CHECK(b_bias.stride(1) == 1, "b_bias.stride(1) != 1"); } else { b_bias = torch::empty({0}, options);