|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#ifndef CLBLAST_CLBLAST_C_H_ |
|
#define CLBLAST_CLBLAST_C_H_ |
|
|
|
|
|
#if defined(__APPLE__) || defined(__MACOSX) |
|
#include <OpenCL/opencl.h> |
|
#else |
|
#include <CL/opencl.h> |
|
#endif |
|
|
|
|
|
|
|
#if defined(_WIN32) && defined(CLBLAST_DLL) |
|
#if defined(COMPILING_DLL) |
|
#define PUBLIC_API __declspec(dllexport) |
|
#else |
|
#define PUBLIC_API __declspec(dllimport) |
|
#endif |
|
#else |
|
#define PUBLIC_API |
|
#endif |
|
|
|
|
|
#define CLBLAST_VERSION_MAJOR 1 |
|
#define CLBLAST_VERSION_MINOR 6 |
|
#define CLBLAST_VERSION_PATCH 0 |
|
|
|
|
|
#ifdef __cplusplus |
|
extern "C" { |
|
#endif |
|
|
|
|
|
|
|
|
|
|
|
typedef enum CLBlastStatusCode_ { |
|
|
|
|
|
CLBlastSuccess = 0, |
|
CLBlastOpenCLCompilerNotAvailable= -3, |
|
CLBlastTempBufferAllocFailure = -4, |
|
CLBlastOpenCLOutOfResources = -5, |
|
CLBlastOpenCLOutOfHostMemory = -6, |
|
CLBlastOpenCLBuildProgramFailure = -11, |
|
CLBlastInvalidValue = -30, |
|
CLBlastInvalidCommandQueue = -36, |
|
CLBlastInvalidMemObject = -38, |
|
CLBlastInvalidBinary = -42, |
|
CLBlastInvalidBuildOptions = -43, |
|
CLBlastInvalidProgram = -44, |
|
CLBlastInvalidProgramExecutable = -45, |
|
CLBlastInvalidKernelName = -46, |
|
CLBlastInvalidKernelDefinition = -47, |
|
CLBlastInvalidKernel = -48, |
|
CLBlastInvalidArgIndex = -49, |
|
CLBlastInvalidArgValue = -50, |
|
CLBlastInvalidArgSize = -51, |
|
CLBlastInvalidKernelArgs = -52, |
|
CLBlastInvalidLocalNumDimensions = -53, |
|
CLBlastInvalidLocalThreadsTotal = -54, |
|
CLBlastInvalidLocalThreadsDim = -55, |
|
CLBlastInvalidGlobalOffset = -56, |
|
CLBlastInvalidEventWaitList = -57, |
|
CLBlastInvalidEvent = -58, |
|
CLBlastInvalidOperation = -59, |
|
CLBlastInvalidBufferSize = -61, |
|
CLBlastInvalidGlobalWorkSize = -63, |
|
|
|
|
|
CLBlastNotImplemented = -1024, |
|
CLBlastInvalidMatrixA = -1022, |
|
CLBlastInvalidMatrixB = -1021, |
|
CLBlastInvalidMatrixC = -1020, |
|
CLBlastInvalidVectorX = -1019, |
|
CLBlastInvalidVectorY = -1018, |
|
CLBlastInvalidDimension = -1017, |
|
CLBlastInvalidLeadDimA = -1016, |
|
CLBlastInvalidLeadDimB = -1015, |
|
CLBlastInvalidLeadDimC = -1014, |
|
CLBlastInvalidIncrementX = -1013, |
|
CLBlastInvalidIncrementY = -1012, |
|
CLBlastInsufficientMemoryA = -1011, |
|
CLBlastInsufficientMemoryB = -1010, |
|
CLBlastInsufficientMemoryC = -1009, |
|
CLBlastInsufficientMemoryX = -1008, |
|
CLBlastInsufficientMemoryY = -1007, |
|
|
|
|
|
CLBlastInsufficientMemoryTemp = -2050, |
|
CLBlastInvalidBatchCount = -2049, |
|
CLBlastInvalidOverrideKernel = -2048, |
|
CLBlastMissingOverrideParameter = -2047, |
|
CLBlastInvalidLocalMemUsage = -2046, |
|
CLBlastNoHalfPrecision = -2045, |
|
CLBlastNoDoublePrecision = -2044, |
|
CLBlastInvalidVectorScalar = -2043, |
|
CLBlastInsufficientMemoryScalar = -2042, |
|
CLBlastDatabaseError = -2041, |
|
CLBlastUnknownError = -2040, |
|
CLBlastUnexpectedError = -2039, |
|
} CLBlastStatusCode; |
|
|
|
|
|
typedef enum CLBlastLayout_ { CLBlastLayoutRowMajor = 101, |
|
CLBlastLayoutColMajor = 102 } CLBlastLayout; |
|
typedef enum CLBlastTranspose_ { CLBlastTransposeNo = 111, CLBlastTransposeYes = 112, |
|
CLBlastTransposeConjugate = 113 } CLBlastTranspose; |
|
typedef enum CLBlastTriangle_ { CLBlastTriangleUpper = 121, |
|
CLBlastTriangleLower = 122 } CLBlastTriangle; |
|
typedef enum CLBlastDiagonal_ { CLBlastDiagonalNonUnit = 131, |
|
CLBlastDiagonalUnit = 132 } CLBlastDiagonal; |
|
typedef enum CLBlastSide_ { CLBlastSideLeft = 141, CLBlastSideRight = 142 } CLBlastSide; |
|
typedef enum CLBlastKernelMode_ { CLBlastKernelModeCrossCorrelation = 151, CLBlastKernelModeConvolution = 152 } CLBlastKernelMode; |
|
|
|
|
|
typedef enum CLBlastPrecision_ { CLBlastPrecisionHalf = 16, CLBlastPrecisionSingle = 32, |
|
CLBlastPrecisionDouble = 64, CLBlastPrecisionComplexSingle = 3232, |
|
CLBlastPrecisionComplexDouble = 6464 } CLBlastPrecision; |
|
|
|
|
|
|
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSrotg(cl_mem sa_buffer, const size_t sa_offset, |
|
cl_mem sb_buffer, const size_t sb_offset, |
|
cl_mem sc_buffer, const size_t sc_offset, |
|
cl_mem ss_buffer, const size_t ss_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDrotg(cl_mem sa_buffer, const size_t sa_offset, |
|
cl_mem sb_buffer, const size_t sb_offset, |
|
cl_mem sc_buffer, const size_t sc_offset, |
|
cl_mem ss_buffer, const size_t ss_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSrotmg(cl_mem sd1_buffer, const size_t sd1_offset, |
|
cl_mem sd2_buffer, const size_t sd2_offset, |
|
cl_mem sx1_buffer, const size_t sx1_offset, |
|
const cl_mem sy1_buffer, const size_t sy1_offset, |
|
cl_mem sparam_buffer, const size_t sparam_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDrotmg(cl_mem sd1_buffer, const size_t sd1_offset, |
|
cl_mem sd2_buffer, const size_t sd2_offset, |
|
cl_mem sx1_buffer, const size_t sx1_offset, |
|
const cl_mem sy1_buffer, const size_t sy1_offset, |
|
cl_mem sparam_buffer, const size_t sparam_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSrot(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const float cos, |
|
const float sin, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDrot(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const double cos, |
|
const double sin, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSrotm(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem sparam_buffer, const size_t sparam_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDrotm(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem sparam_buffer, const size_t sparam_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSswap(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDswap(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCswap(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZswap(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHswap(const size_t n, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSscal(const size_t n, |
|
const float alpha, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDscal(const size_t n, |
|
const double alpha, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCscal(const size_t n, |
|
const cl_float2 alpha, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZscal(const size_t n, |
|
const cl_double2 alpha, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHscal(const size_t n, |
|
const cl_half alpha, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastScopy(const size_t n, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDcopy(const size_t n, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCcopy(const size_t n, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZcopy(const size_t n, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHcopy(const size_t n, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSaxpy(const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDaxpy(const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCaxpy(const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZaxpy(const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHaxpy(const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSdot(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDdot(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHdot(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCdotu(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZdotu(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCdotc(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZdotc(const size_t n, |
|
cl_mem dot_buffer, const size_t dot_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSnrm2(const size_t n, |
|
cl_mem nrm2_buffer, const size_t nrm2_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDnrm2(const size_t n, |
|
cl_mem nrm2_buffer, const size_t nrm2_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastScnrm2(const size_t n, |
|
cl_mem nrm2_buffer, const size_t nrm2_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDznrm2(const size_t n, |
|
cl_mem nrm2_buffer, const size_t nrm2_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHnrm2(const size_t n, |
|
cl_mem nrm2_buffer, const size_t nrm2_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSasum(const size_t n, |
|
cl_mem asum_buffer, const size_t asum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDasum(const size_t n, |
|
cl_mem asum_buffer, const size_t asum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastScasum(const size_t n, |
|
cl_mem asum_buffer, const size_t asum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDzasum(const size_t n, |
|
cl_mem asum_buffer, const size_t asum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHasum(const size_t n, |
|
cl_mem asum_buffer, const size_t asum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsum(const size_t n, |
|
cl_mem sum_buffer, const size_t sum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsum(const size_t n, |
|
cl_mem sum_buffer, const size_t sum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastScsum(const size_t n, |
|
cl_mem sum_buffer, const size_t sum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDzsum(const size_t n, |
|
cl_mem sum_buffer, const size_t sum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsum(const size_t n, |
|
cl_mem sum_buffer, const size_t sum_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastiSamax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiDamax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiCamax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiZamax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiHamax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastiSamin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiDamin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiCamin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiZamin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiHamin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastiSmax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiDmax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiCmax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiZmax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiHmax(const size_t n, |
|
cl_mem imax_buffer, const size_t imax_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastiSmin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiDmin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiCmin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiZmin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastiHmin(const size_t n, |
|
cl_mem imin_buffer, const size_t imin_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
|
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const float beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const double beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_float2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_double2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_half beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, const size_t kl, const size_t ku, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const float beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, const size_t kl, const size_t ku, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const double beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, const size_t kl, const size_t ku, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_float2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, const size_t kl, const size_t ku, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_double2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, const size_t kl, const size_t ku, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_half beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastChemv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_float2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhemv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_double2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastChbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_float2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_double2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastChpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_float2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_double2 beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsymv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const float beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsymv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const double beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsymv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_half beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const float beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const double beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, const size_t k, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_half beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSspmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const float beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDspmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const double beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHspmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_half alpha, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_half beta, |
|
cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, const size_t k, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t n, |
|
const cl_mem ap_buffer, const size_t ap_offset, |
|
cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSger(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDger(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHger(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCgeru(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgeru(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCgerc(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgerc(const CLBlastLayout layout, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCher(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZher(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastChpr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhpr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCher2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZher2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastChpr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhpr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsyr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsyr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsyr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSspr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDspr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHspr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsyr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsyr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsyr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSspr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDspr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHspr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
|
const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
cl_mem ap_buffer, const size_t ap_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
|
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_half beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_half beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastChemm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhemm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_half beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCherk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZherk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
|
const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_half beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCher2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZher2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
|
const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastStrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDtrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCtrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZtrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
|
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastShad(const size_t n, |
|
const float alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const float beta, |
|
cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDhad(const size_t n, |
|
const double alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const double beta, |
|
cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastChad(const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const cl_float2 beta, |
|
cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZhad(const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const cl_double2 beta, |
|
cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHhad(const size_t n, |
|
const cl_half alpha, |
|
const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
|
const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
|
const cl_half beta, |
|
cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastComatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
|
const size_t m, const size_t n, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSim2col(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
cl_mem col_buffer, const size_t col_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDim2col(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
cl_mem col_buffer, const size_t col_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCim2col(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
cl_mem col_buffer, const size_t col_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZim2col(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
cl_mem col_buffer, const size_t col_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHim2col(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
cl_mem col_buffer, const size_t col_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastScol2im(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem col_buffer, const size_t col_offset, |
|
cl_mem im_buffer, const size_t im_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDcol2im(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem col_buffer, const size_t col_offset, |
|
cl_mem im_buffer, const size_t im_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCcol2im(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem col_buffer, const size_t col_offset, |
|
cl_mem im_buffer, const size_t im_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZcol2im(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem col_buffer, const size_t col_offset, |
|
cl_mem im_buffer, const size_t im_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHcol2im(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
|
const cl_mem col_buffer, const size_t col_offset, |
|
cl_mem im_buffer, const size_t im_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSconvgemm(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, const size_t num_kernels, const size_t batch_count, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
const cl_mem kernel_buffer, const size_t kernel_offset, |
|
cl_mem result_buffer, const size_t result_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDconvgemm(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, const size_t num_kernels, const size_t batch_count, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
const cl_mem kernel_buffer, const size_t kernel_offset, |
|
cl_mem result_buffer, const size_t result_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHconvgemm(const CLBlastKernelMode kernel_mode, |
|
const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, const size_t num_kernels, const size_t batch_count, |
|
const cl_mem im_buffer, const size_t im_offset, |
|
const cl_mem kernel_buffer, const size_t kernel_offset, |
|
cl_mem result_buffer, const size_t result_offset, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSaxpyBatched(const size_t n, |
|
const float *alphas, |
|
const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
|
cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDaxpyBatched(const size_t n, |
|
const double *alphas, |
|
const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
|
cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCaxpyBatched(const size_t n, |
|
const cl_float2 *alphas, |
|
const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
|
cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZaxpyBatched(const size_t n, |
|
const cl_double2 *alphas, |
|
const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
|
cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHaxpyBatched(const size_t n, |
|
const cl_half *alphas, |
|
const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
|
cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const float *alphas, |
|
const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
|
const float *betas, |
|
cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const double *alphas, |
|
const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
|
const double *betas, |
|
cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_float2 *alphas, |
|
const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
|
const cl_float2 *betas, |
|
cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_double2 *alphas, |
|
const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
|
const cl_double2 *betas, |
|
cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_half *alphas, |
|
const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
|
const cl_half *betas, |
|
cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastDgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastCgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
CLBlastStatusCode PUBLIC_API CLBlastHgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
|
const cl_half beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
|
const size_t batch_count, |
|
cl_command_queue* queue, cl_event* event); |
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const float alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const float beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
|
CLBlastStatusCode PUBLIC_API CLBlastDgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const double alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const double beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
|
CLBlastStatusCode PUBLIC_API CLBlastCgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_float2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_float2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
|
CLBlastStatusCode PUBLIC_API CLBlastZgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_double2 alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_double2 beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
|
CLBlastStatusCode PUBLIC_API CLBlastHgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const cl_half alpha, |
|
const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
|
const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
|
const cl_half beta, |
|
cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastSGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const size_t a_offset, const size_t a_ld, |
|
const size_t b_offset, const size_t b_ld, |
|
const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, |
|
size_t* temp_buffer_size); |
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastDGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const size_t a_offset, const size_t a_ld, |
|
const size_t b_offset, const size_t b_ld, |
|
const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, |
|
size_t* temp_buffer_size); |
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastCGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const size_t a_offset, const size_t a_ld, |
|
const size_t b_offset, const size_t b_ld, |
|
const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, |
|
size_t* temp_buffer_size); |
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastZGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const size_t a_offset, const size_t a_ld, |
|
const size_t b_offset, const size_t b_ld, |
|
const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, |
|
size_t* temp_buffer_size); |
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastHGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
|
const size_t m, const size_t n, const size_t k, |
|
const size_t a_offset, const size_t a_ld, |
|
const size_t b_offset, const size_t b_ld, |
|
const size_t c_offset, const size_t c_ld, |
|
cl_command_queue* queue, |
|
size_t* temp_buffer_size); |
|
|
|
|
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastClearCache(); |
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastFillCache(const cl_device_id device); |
|
|
|
|
|
|
|
|
|
|
|
CLBlastStatusCode PUBLIC_API CLBlastOverrideParameters(const cl_device_id device, const char* kernel_name, |
|
const CLBlastPrecision precision, const size_t num_parameters, |
|
const char** parameters_names, const size_t* parameters_values); |
|
|
|
|
|
|
|
#ifdef __cplusplus |
|
} |
|
#endif |
|
|
|
|
|
#endif |
|
|