- Add BF16 support for SM90 and SM100 - Refactor Python APIs - Other fixes and code refactoring
76 lines
1.9 KiB
C++
76 lines
1.9 KiB
C++
#pragma once
|
|
|
|
#include <exception>
|
|
#include <string>
|
|
#include <sstream>
|
|
|
|
namespace deep_gemm {
|
|
|
|
class DGException final : public std::exception {
|
|
std::string message = {};
|
|
|
|
public:
|
|
explicit DGException(const char *name, const char* file, const int line, const std::string& error) {
|
|
message = std::string(name) + " error (" + file + ":" + std::to_string(line) + "): " + error;
|
|
}
|
|
|
|
const char *what() const noexcept override {
|
|
return message.c_str();
|
|
}
|
|
};
|
|
|
|
#ifndef DG_STATIC_ASSERT
|
|
#define DG_STATIC_ASSERT(cond, ...) static_assert(cond, __VA_ARGS__)
|
|
#endif
|
|
|
|
#ifndef DG_HOST_ASSERT
|
|
#define DG_HOST_ASSERT(cond) \
|
|
do { \
|
|
if (not (cond)) { \
|
|
throw DGException("Assertion", __FILE__, __LINE__, #cond); \
|
|
} \
|
|
} while (0)
|
|
#endif
|
|
|
|
#ifndef DG_HOST_UNREACHABLE
|
|
#define DG_HOST_UNREACHABLE(reason) (throw DGException("Assertion", __FILE__, __LINE__, reason))
|
|
#endif
|
|
|
|
#ifndef DG_NVRTC_CHECK
|
|
#define DG_NVRTC_CHECK(cmd) \
|
|
do { \
|
|
const auto& e = (cmd); \
|
|
if (e != NVRTC_SUCCESS) { \
|
|
throw DGException("NVRTC", __FILE__, __LINE__, nvrtcGetErrorString(e)); \
|
|
} \
|
|
} while (0)
|
|
#endif
|
|
|
|
#ifndef DG_CUDA_DRIVER_CHECK
|
|
#define DG_CUDA_DRIVER_CHECK(cmd) \
|
|
do { \
|
|
const auto& e = (cmd); \
|
|
if (e != CUDA_SUCCESS) { \
|
|
std::stringstream ss; \
|
|
const char *name, *info; \
|
|
cuGetErrorName(e, &name), cuGetErrorString(e, &info); \
|
|
ss << static_cast<int>(e) << " (" << name << ", " << info << ")"; \
|
|
throw DGException("CUDA driver", __FILE__, __LINE__, ss.str()); \
|
|
} \
|
|
} while (0)
|
|
#endif
|
|
|
|
#ifndef DG_CUDA_RUNTIME_CHECK
|
|
#define DG_CUDA_RUNTIME_CHECK(cmd) \
|
|
do { \
|
|
const auto& e = (cmd); \
|
|
if (e != cudaSuccess) { \
|
|
std::stringstream ss; \
|
|
ss << static_cast<int>(e) << " (" << cudaGetErrorName(e) << ", " << cudaGetErrorString(e) << ")"; \
|
|
throw DGException("CUDA runtime", __FILE__, __LINE__, ss.str()); \
|
|
} \
|
|
} while (0)
|
|
#endif
|
|
|
|
} // namespace deep_gemm
|