workaround of AWQ for Turing GPUs (#1252)

This commit is contained in:
twaka
2023-10-11 11:48:16 +09:00
committed by GitHub
parent 91fce82c6f
commit 8285736840
3 changed files with 73 additions and 5 deletions

View File

@@ -16,7 +16,7 @@ namespace awq {
__device__ uint4 dequantize_s4_to_fp16x2(uint32_t const& source)
{
-#if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 800
+#if defined(__CUDA_ARCH__) && __CUDA_ARCH__ < 750
assert(false);
#else
uint4 result;