diff --git a/dsv4/kernels/attention/fmha_sm100.cpp b/dsv4/kernels/attention/fmha_sm100.cpp index a4188a8c..6c64144a 100644 --- a/dsv4/kernels/attention/fmha_sm100.cpp +++ b/dsv4/kernels/attention/fmha_sm100.cpp @@ -5,7 +5,6 @@ #include "fmha_sm100.cuh" #include #include -#include namespace dsv4 { namespace kernels { diff --git a/dsv4/kernels/attention/fmha_sm100.cuh b/dsv4/kernels/attention/fmha_sm100.cuh index bd69d497..06683854 100644 --- a/dsv4/kernels/attention/fmha_sm100.cuh +++ b/dsv4/kernels/attention/fmha_sm100.cuh @@ -29,16 +29,18 @@ #pragma once -#include #include -#include #include + +// CUTLASS C++ includes (CUDA device code only) +#if defined(__CUDA_ARCH__) #include #include #include #include #include #include +#endif namespace dsv4 { namespace kernels {