#pragma once

// CUDA toolkit headers: runtime API, driver API, cuBLAS (v2 interface) and
// half-precision types/intrinsics.
#include <cuda_runtime.h>
#include <cuda.h>
#include <cublas_v2.h>
#include <cuda_fp16.h>

// Compatibility shim for CUDA runtimes older than 11.2
// (CUDART_VERSION is encoded as major * 1000 + minor * 10, so 11020 == 11.2).
//
// Each macro below rewrites the identifier on the left into the identifier on
// the right, so code written against the left-hand spellings still compiles
// with the older toolkit.
// NOTE(review): presumably the left-hand names are the ones used by the rest
// of the project and are missing (or spelled differently) in older toolkits;
// confirm against the minimum supported CUDA version.
#if CUDART_VERSION < 11020
// Driver-API device attribute: use the "virtual address management" spelling.
#define CU_DEVICE_ATTRIBUTE_VIRTUAL_MEMORY_MANAGEMENT_SUPPORTED CU_DEVICE_ATTRIBUTE_VIRTUAL_ADDRESS_MANAGEMENT_SUPPORTED
// cuBLAS math mode: substitute the generic tensor-op math mode for the TF32 one.
#define CUBLAS_TF32_TENSOR_OP_MATH CUBLAS_TENSOR_OP_MATH
// cuBLAS compute types: substitute cudaDataType_t enumerators and the
// cudaDataType_t type itself for the cublasComputeType_t family.
#define CUBLAS_COMPUTE_16F CUDA_R_16F
#define CUBLAS_COMPUTE_32F CUDA_R_32F
#define cublasComputeType_t cudaDataType_t
#endif // CUDART_VERSION < 11020