|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| #ifndef CLBLAST_CLBLAST_C_H_ |
| #define CLBLAST_CLBLAST_C_H_ |
|
|
| |
| #if defined(__APPLE__) || defined(__MACOSX) |
| #include <OpenCL/opencl.h> |
| #else |
| #include <CL/opencl.h> |
| #endif |
|
|
| /* PUBLIC_API decorates every prototype declared below. When both _WIN32 and CLBLAST_DLL are defined it expands to */ |
| /* __declspec(dllexport) if COMPILING_DLL is also defined, otherwise __declspec(dllimport); in all other builds it is empty. */ |
| #if defined(_WIN32) && defined(CLBLAST_DLL) |
| #if defined(COMPILING_DLL) |
| #define PUBLIC_API __declspec(dllexport) |
| #else |
| #define PUBLIC_API __declspec(dllimport) |
| #endif |
| #else |
| #define PUBLIC_API |
| #endif |
|
|
| /* Library version exposed as three integer macros: major.minor.patch = 1.6.0. */ |
| #define CLBLAST_VERSION_MAJOR 1 |
| #define CLBLAST_VERSION_MINOR 6 |
| #define CLBLAST_VERSION_PATCH 0 |
|
|
| /* Opens a C-linkage region when the header is compiled as C++; the matching closing brace is not within this part of the file. */ |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
|
|
| |
|
|
| /* Status codes: the return type of the routines declared in this header. CLBlastSuccess is 0 and every other */ |
| /* enumerator carries an explicitly assigned, distinct negative value, grouped into three numeric ranges below. */ |
| typedef enum CLBlastStatusCode_ { |
|
|
| /* Success plus the range -3 .. -63. NOTE(review): values look like the corresponding OpenCL CL_* error codes; confirm against CL/cl.h. */ |
| CLBlastSuccess = 0, |
| CLBlastOpenCLCompilerNotAvailable= -3, |
| CLBlastTempBufferAllocFailure = -4, |
| CLBlastOpenCLOutOfResources = -5, |
| CLBlastOpenCLOutOfHostMemory = -6, |
| CLBlastOpenCLBuildProgramFailure = -11, |
| CLBlastInvalidValue = -30, |
| CLBlastInvalidCommandQueue = -36, |
| CLBlastInvalidMemObject = -38, |
| CLBlastInvalidBinary = -42, |
| CLBlastInvalidBuildOptions = -43, |
| CLBlastInvalidProgram = -44, |
| CLBlastInvalidProgramExecutable = -45, |
| CLBlastInvalidKernelName = -46, |
| CLBlastInvalidKernelDefinition = -47, |
| CLBlastInvalidKernel = -48, |
| CLBlastInvalidArgIndex = -49, |
| CLBlastInvalidArgValue = -50, |
| CLBlastInvalidArgSize = -51, |
| CLBlastInvalidKernelArgs = -52, |
| CLBlastInvalidLocalNumDimensions = -53, |
| CLBlastInvalidLocalThreadsTotal = -54, |
| CLBlastInvalidLocalThreadsDim = -55, |
| CLBlastInvalidGlobalOffset = -56, |
| CLBlastInvalidEventWaitList = -57, |
| CLBlastInvalidEvent = -58, |
| CLBlastInvalidOperation = -59, |
| CLBlastInvalidBufferSize = -61, |
| CLBlastInvalidGlobalWorkSize = -63, |
|
|
| /* Range -1024 .. -1007; note that -1023 is left unassigned. NOTE(review): presumably mirrors the clBLAS status codes; confirm. */ |
| CLBlastNotImplemented = -1024, |
| CLBlastInvalidMatrixA = -1022, |
| CLBlastInvalidMatrixB = -1021, |
| CLBlastInvalidMatrixC = -1020, |
| CLBlastInvalidVectorX = -1019, |
| CLBlastInvalidVectorY = -1018, |
| CLBlastInvalidDimension = -1017, |
| CLBlastInvalidLeadDimA = -1016, |
| CLBlastInvalidLeadDimB = -1015, |
| CLBlastInvalidLeadDimC = -1014, |
| CLBlastInvalidIncrementX = -1013, |
| CLBlastInvalidIncrementY = -1012, |
| CLBlastInsufficientMemoryA = -1011, |
| CLBlastInsufficientMemoryB = -1010, |
| CLBlastInsufficientMemoryC = -1009, |
| CLBlastInsufficientMemoryX = -1008, |
| CLBlastInsufficientMemoryY = -1007, |
|
|
| /* Contiguous range -2050 .. -2039. NOTE(review): presumably library-specific codes with no OpenCL or clBLAS counterpart; confirm. */ |
| CLBlastInsufficientMemoryTemp = -2050, |
| CLBlastInvalidBatchCount = -2049, |
| CLBlastInvalidOverrideKernel = -2048, |
| CLBlastMissingOverrideParameter = -2047, |
| CLBlastInvalidLocalMemUsage = -2046, |
| CLBlastNoHalfPrecision = -2045, |
| CLBlastNoDoublePrecision = -2044, |
| CLBlastInvalidVectorScalar = -2043, |
| CLBlastInsufficientMemoryScalar = -2042, |
| CLBlastDatabaseError = -2041, |
| CLBlastUnknownError = -2040, |
| CLBlastUnexpectedError = -2039, |
| } CLBlastStatusCode; |
|
|
| /* Option enums taken by the matrix routines. Each family has its own value range: layout 101-102, transpose 111-113, triangle 121-122, diagonal 131-132, side 141-142, kernel mode 151-152. */ |
| typedef enum CLBlastLayout_ { CLBlastLayoutRowMajor = 101, |
| CLBlastLayoutColMajor = 102 } CLBlastLayout; |
| typedef enum CLBlastTranspose_ { CLBlastTransposeNo = 111, CLBlastTransposeYes = 112, |
| CLBlastTransposeConjugate = 113 } CLBlastTranspose; |
| typedef enum CLBlastTriangle_ { CLBlastTriangleUpper = 121, |
| CLBlastTriangleLower = 122 } CLBlastTriangle; |
| typedef enum CLBlastDiagonal_ { CLBlastDiagonalNonUnit = 131, |
| CLBlastDiagonalUnit = 132 } CLBlastDiagonal; |
| typedef enum CLBlastSide_ { CLBlastSideLeft = 141, CLBlastSideRight = 142 } CLBlastSide; |
| typedef enum CLBlastKernelMode_ { CLBlastKernelModeCrossCorrelation = 151, CLBlastKernelModeConvolution = 152 } CLBlastKernelMode; |
|
|
| /* Precision selector with values 16, 32, 64, 3232 and 6464. NOTE(review): looks like bits per component, written twice for the complex types; confirm. */ |
| typedef enum CLBlastPrecision_ { CLBlastPrecisionHalf = 16, CLBlastPrecisionSingle = 32, |
| CLBlastPrecisionDouble = 64, CLBlastPrecisionComplexSingle = 3232, |
| CLBlastPrecisionComplexDouble = 6464 } CLBlastPrecision; |
|
|
| |
| |
| |
|
|
| /* xROTG (S, D): four buffer/offset pairs (sa, sb, sc, ss) followed by queue and event. The D variant keeps the s-prefixed parameter names. Presumably the BLAS Givens-rotation setup; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSrotg(cl_mem sa_buffer, const size_t sa_offset, |
| cl_mem sb_buffer, const size_t sb_offset, |
| cl_mem sc_buffer, const size_t sc_offset, |
| cl_mem ss_buffer, const size_t ss_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDrotg(cl_mem sa_buffer, const size_t sa_offset, |
| cl_mem sb_buffer, const size_t sb_offset, |
| cl_mem sc_buffer, const size_t sc_offset, |
| cl_mem ss_buffer, const size_t ss_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xROTMG (S, D): buffer/offset pairs sd1, sd2, sx1, sy1 (the only const cl_mem) and sparam, followed by queue and event. Presumably the BLAS modified-Givens setup; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSrotmg(cl_mem sd1_buffer, const size_t sd1_offset, |
| cl_mem sd2_buffer, const size_t sd2_offset, |
| cl_mem sx1_buffer, const size_t sx1_offset, |
| const cl_mem sy1_buffer, const size_t sy1_offset, |
| cl_mem sparam_buffer, const size_t sparam_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDrotmg(cl_mem sd1_buffer, const size_t sd1_offset, |
| cl_mem sd2_buffer, const size_t sd2_offset, |
| cl_mem sx1_buffer, const size_t sx1_offset, |
| const cl_mem sy1_buffer, const size_t sy1_offset, |
| cl_mem sparam_buffer, const size_t sparam_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xROT (S, D): n, the x and y buffers (each with offset and increment), then by-value cos and sin scalars (float or double). Presumably applies a plane rotation to x and y; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSrot(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const float cos, |
| const float sin, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDrot(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const double cos, |
| const double sin, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xROTM (S, D): n, the x and y buffers (each with offset and increment), then an sparam buffer/offset pair. Presumably applies a modified Givens rotation described by sparam; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSrotm(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem sparam_buffer, const size_t sparam_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDrotm(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem sparam_buffer, const size_t sparam_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xSWAP (S, D, C, Z, H): n, then the x and y buffers, each with offset and increment; neither buffer is const-qualified. Presumably exchanges the contents of x and y; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSswap(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDswap(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCswap(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZswap(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHswap(const size_t n, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xSCAL (S, D, C, Z, H): n, by-value alpha (float, double, cl_float2, cl_double2, cl_half respectively), then the x buffer with offset and increment. Presumably x = alpha * x; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSscal(const size_t n, |
| const float alpha, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDscal(const size_t n, |
| const double alpha, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCscal(const size_t n, |
| const cl_float2 alpha, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZscal(const size_t n, |
| const cl_double2 alpha, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHscal(const size_t n, |
| const cl_half alpha, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xCOPY (S, D, C, Z, H): n, a const x buffer and a non-const y buffer, each with offset and increment. Presumably copies x into y; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastScopy(const size_t n, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDcopy(const size_t n, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCcopy(const size_t n, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZcopy(const size_t n, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHcopy(const size_t n, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xAXPY (S, D, C, Z, H): n, by-value alpha, a const x buffer and a non-const y buffer, each with offset and increment. Presumably y = alpha * x + y; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSaxpy(const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDaxpy(const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCaxpy(const size_t n, |
| const cl_float2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZaxpy(const size_t n, |
| const cl_double2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHaxpy(const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xDOT (S, D, H): n, a dot buffer/offset pair (the only non-const buffer), then const x and y buffers with offset and increment. Presumably the dot product of x and y is written to dot_buffer; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSdot(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDdot(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHdot(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xDOTU (C, Z): n, a dot buffer/offset pair, then const x and y buffers with offset and increment. Presumably the complex dot product without conjugation; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCdotu(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZdotu(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xDOTC (C, Z): n, a dot buffer/offset pair, then const x and y buffers with offset and increment. Presumably the complex dot product with the first vector conjugated; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCdotc(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZdotc(const size_t n, |
| cl_mem dot_buffer, const size_t dot_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xNRM2 (S, D, Sc, Dz, H): n, an nrm2 buffer/offset pair, then a const x buffer with offset and increment. Presumably the Euclidean norm of x is written to nrm2_buffer; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSnrm2(const size_t n, |
| cl_mem nrm2_buffer, const size_t nrm2_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDnrm2(const size_t n, |
| cl_mem nrm2_buffer, const size_t nrm2_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastScnrm2(const size_t n, |
| cl_mem nrm2_buffer, const size_t nrm2_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDznrm2(const size_t n, |
| cl_mem nrm2_buffer, const size_t nrm2_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHnrm2(const size_t n, |
| cl_mem nrm2_buffer, const size_t nrm2_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xASUM (S, D, Sc, Dz, H): n, an asum buffer/offset pair, then a const x buffer with offset and increment. Presumably the sum of absolute values of x is written to asum_buffer; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSasum(const size_t n, |
| cl_mem asum_buffer, const size_t asum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDasum(const size_t n, |
| cl_mem asum_buffer, const size_t asum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastScasum(const size_t n, |
| cl_mem asum_buffer, const size_t asum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDzasum(const size_t n, |
| cl_mem asum_buffer, const size_t asum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHasum(const size_t n, |
| cl_mem asum_buffer, const size_t asum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xSUM (S, D, Sc, Dz, H): n, a sum buffer/offset pair, then a const x buffer with offset and increment. Presumably the plain (non-absolute) sum of the elements of x, which is not a reference BLAS routine; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsum(const size_t n, |
| cl_mem sum_buffer, const size_t sum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsum(const size_t n, |
| cl_mem sum_buffer, const size_t sum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastScsum(const size_t n, |
| cl_mem sum_buffer, const size_t sum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDzsum(const size_t n, |
| cl_mem sum_buffer, const size_t sum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsum(const size_t n, |
| cl_mem sum_buffer, const size_t sum_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* ixAMAX (iS, iD, iC, iZ, iH): n, an imax buffer/offset pair, then a const x buffer with offset and increment. Presumably the index of the element of x with the largest absolute value; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastiSamax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiDamax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiCamax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiZamax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiHamax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* ixAMIN (iS, iD, iC, iZ, iH): n, an imin buffer/offset pair, then a const x buffer with offset and increment. Presumably the index of the element of x with the smallest absolute value; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastiSamin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiDamin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiCamin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiZamin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiHamin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* ixMAX (iS, iD, iC, iZ, iH): n, an imax buffer/offset pair, then a const x buffer with offset and increment. Presumably the index of the largest element of x by signed value rather than magnitude; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastiSmax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiDmax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiCmax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiZmax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiHmax(const size_t n, |
| cl_mem imax_buffer, const size_t imax_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* ixMIN (iS, iD, iC, iZ, iH): n, an imin buffer/offset pair, then a const x buffer with offset and increment. Presumably the index of the smallest element of x by signed value rather than magnitude; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastiSmin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiDmin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiCmin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiZmin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastiHmin(const size_t n, |
| cl_mem imin_buffer, const size_t imin_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| |
| |
| |
|
|
| /* xGEMV (S, D, C, Z, H): layout and a_transpose options, dimensions m and n, alpha, const A buffer (offset, leading dimension a_ld), const x buffer, beta, then the non-const y buffer. Presumably y = alpha * op(A) * x + beta * y; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const float beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const double beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_float2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_double2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHgemv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_half beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xGBMV (S, D, C, Z, H): layout and a_transpose options, dimensions m and n plus kl and ku, alpha, const A buffer (offset, a_ld), const x buffer, beta, then the non-const y buffer. Presumably the banded matrix-vector product with kl sub- and ku super-diagonals; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, const size_t kl, const size_t ku, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const float beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, const size_t kl, const size_t ku, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const double beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, const size_t kl, const size_t ku, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_float2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, const size_t kl, const size_t ku, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_double2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHgbmv(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, const size_t kl, const size_t ku, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_half beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xHEMV (C, Z): layout and triangle options, dimension n, alpha, const A buffer (offset, a_ld), const x buffer, beta, then the non-const y buffer. Presumably the Hermitian matrix-vector product; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastChemv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_float2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhemv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_double2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xHBMV (C, Z): layout and triangle options, dimensions n and k, alpha, const A buffer (offset, a_ld), const x buffer, beta, then the non-const y buffer. Presumably the Hermitian banded matrix-vector product with k off-diagonals; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastChbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_float2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_double2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xHPMV (C, Z): layout and triangle options, dimension n, alpha, const ap buffer with offset only (no leading dimension), const x buffer, beta, then the non-const y buffer. Presumably the packed Hermitian matrix-vector product; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastChpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_float2 alpha, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_float2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_double2 alpha, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_double2 beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xSYMV (S, D, H): layout and triangle options, dimension n, alpha, const A buffer (offset, a_ld), const x buffer, beta, then the non-const y buffer. Presumably the symmetric matrix-vector product; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsymv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const float beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsymv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const double beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsymv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_half beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xSBMV (S, D, H): layout and triangle options, dimensions n and k, alpha, const A buffer (offset, a_ld), const x buffer, beta, then the non-const y buffer. Presumably the symmetric banded matrix-vector product with k off-diagonals; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const float beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const double beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, const size_t k, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_half beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* xSPMV (S, D, H): layout and triangle options, dimension n, alpha, const ap buffer with offset only (no leading dimension), const x buffer, beta, then the non-const y buffer. Presumably the packed symmetric matrix-vector product; confirm against the library API docs. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSspmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const float beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDspmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const double beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHspmv(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_half alpha, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_half beta, |
| cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Triangular matrix-vector multiplication: STRMV/DTRMV/CTRMV/ZTRMV/HTRMV. No scalar arguments; x_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHtrmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Triangular banded matrix-vector multiplication: STBMV/DTBMV/CTBMV/ZTBMV/HTBMV. Takes an extra size k next to n; x_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHtbmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Triangular packed matrix-vector multiplication: STPMV/DTPMV/CTPMV/ZTPMV/HTPMV. The matrix is passed as ap_buffer/ap_offset (no leading dimension); x_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHtpmv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Solves a triangular system of equations: STRSV/DTRSV/CTRSV/ZTRSV (no half-precision variant is declared in this group). x_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtrsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Solves a banded triangular system of equations: STBSV/DTBSV/CTBSV/ZTBSV (no half-precision variant is declared in this group). x_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtbsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, const size_t k, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Solves a packed triangular system of equations: STPSV/DTPSV/CTPSV/ZTPSV (no half-precision variant is declared in this group). x_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtpsv(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t n, |
| const cl_mem ap_buffer, const size_t ap_offset, |
| cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* General rank-1 matrix update: SGER/DGER/HGER (float/double/cl_half alpha). a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSger(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDger(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHger(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* General rank-1 complex matrix update: CGERU/ZGERU (cl_float2/cl_double2 alpha). a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCgeru(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgeru(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* General rank-1 complex conjugated matrix update: CGERC/ZGERC (cl_float2/cl_double2 alpha). Same parameter list as the xGERU routines; a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCgerc(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgerc(const CLBlastLayout layout, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Hermitian rank-1 matrix update: CHER/ZHER. Note that alpha is a real scalar (float/double), not cl_float2/cl_double2; a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCher(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZher(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Hermitian packed rank-1 matrix update: CHPR/ZHPR. alpha is a real scalar (float/double); ap_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastChpr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhpr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Hermitian rank-2 matrix update: CHER2/ZHER2 (cl_float2/cl_double2 alpha). Takes two input vectors x and y; a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCher2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_float2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZher2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_double2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Hermitian packed rank-2 matrix update: CHPR2/ZHPR2 (cl_float2/cl_double2 alpha). Takes two input vectors x and y; ap_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastChpr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_float2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhpr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_double2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Symmetric rank-1 matrix update: SSYR/DSYR/HSYR (float/double/cl_half alpha). a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsyr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsyr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsyr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Symmetric packed rank-1 matrix update: SSPR/DSPR/HSPR (float/double/cl_half alpha). ap_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSspr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDspr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHspr(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Symmetric rank-2 matrix update: SSYR2/DSYR2/HSYR2 (float/double/cl_half alpha). Takes two input vectors x and y; a_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsyr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsyr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsyr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Symmetric packed rank-2 matrix update: SSPR2/DSPR2/HSPR2 (float/double/cl_half alpha). Takes two input vectors x and y; ap_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSspr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDspr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHspr2(const CLBlastLayout layout, const CLBlastTriangle triangle, |
| const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| cl_mem ap_buffer, const size_t ap_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
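| /* ============================================================================================== */ |
| /* BLAS level-3 (matrix-matrix) routines */ |
| /* ============================================================================================== */ |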
|
|
| /* General matrix-matrix multiplication: SGEMM/DGEMM/CGEMM/ZGEMM/HGEMM (float/double/cl_float2/cl_double2/cl_half scalars). c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHgemm(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_half beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Symmetric matrix-matrix multiplication: SSYMM/DSYMM/CSYMM/ZSYMM/HSYMM (float/double/cl_float2/cl_double2/cl_half scalars). c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsymm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_half beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Hermitian matrix-matrix multiplication: CHEMM/ZHEMM (cl_float2/cl_double2 alpha and beta). c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastChemm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhemm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Rank-K update of a symmetric matrix: SSYRK/DSYRK/CSYRK/ZSYRK/HSYRK (float/double/cl_float2/cl_double2/cl_half scalars). Single input matrix a; c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsyrk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_half beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Rank-K update of a hermitian matrix: CHERK/ZHERK. Note that both alpha and beta are real scalars (float/double); c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCherk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZherk(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, |
| const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Rank-2K update of a symmetric matrix: SSYR2K/DSYR2K/CSYR2K/ZSYR2K/HSYR2K. One transpose flag (ab_transpose) covers both inputs a and b; c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHsyr2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_half beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* Rank-2K update of a hermitian matrix: CHER2K/ZHER2K. Note the mixed scalar types: alpha is complex (cl_float2/cl_double2) while beta is real (float/double); c_buffer is the only non-const cl_mem argument. */ |
| CLBlastStatusCode PUBLIC_API CLBlastCher2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZher2k(const CLBlastLayout layout, const CLBlastTriangle triangle, const CLBlastTranspose ab_transpose, |
| const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* STRMM/DTRMM/CTRMM/ZTRMM/HTRMM: a_buffer is const and b_buffer is not; there is no beta and no separate output buffer. NOTE(review): presumably the BLAS triangular matrix-matrix multiply with the result stored in b_buffer - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHtrmm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* STRSM/DTRSM/CTRSM/ZTRSM (no cl_half variant is declared in this group): const a_buffer, non-const b_buffer, single alpha scalar. NOTE(review): presumably the BLAS triangular solve whose solution overwrites b_buffer - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastStrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDtrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCtrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZtrsm(const CLBlastLayout layout, const CLBlastSide side, const CLBlastTriangle triangle, const CLBlastTranspose a_transpose, const CLBlastDiagonal diagonal, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| |
| |
| |
|
|
| /* SHAD/DHAD/CHAD/ZHAD/HHAD: two const inputs (x_buffer, y_buffer), one non-const z_buffer, each with its own offset and increment, plus alpha and beta scalars. NOTE(review): presumably an element-wise (Hadamard) product of x and y combined with z - confirm the exact formula. */ |
| CLBlastStatusCode PUBLIC_API CLBlastShad(const size_t n, |
| const float alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const float beta, |
| cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDhad(const size_t n, |
| const double alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const double beta, |
| cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastChad(const size_t n, |
| const cl_float2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const cl_float2 beta, |
| cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZhad(const size_t n, |
| const cl_double2 alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const cl_double2 beta, |
| cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHhad(const size_t n, |
| const cl_half alpha, |
| const cl_mem x_buffer, const size_t x_offset, const size_t x_inc, |
| const cl_mem y_buffer, const size_t y_offset, const size_t y_inc, |
| const cl_half beta, |
| cl_mem z_buffer, const size_t z_offset, const size_t z_inc, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SOMATCOPY/DOMATCOPY/COMATCOPY/ZOMATCOPY/HOMATCOPY: const a_buffer, non-const b_buffer, one alpha scalar and an a_transpose flag. NOTE(review): presumably an out-of-place scaled copy or transpose of an m-by-n matrix from a_buffer into b_buffer - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastComatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHomatcopy(const CLBlastLayout layout, const CLBlastTranspose a_transpose, |
| const size_t m, const size_t n, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SIM2COL/DIM2COL/CIM2COL/ZIM2COL/HIM2COL: the five declarations differ only in name; im_buffer is const and col_buffer is non-const, and no scalars are passed. NOTE(review): presumably the image-to-column transform used to lower convolutions - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSim2col(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem im_buffer, const size_t im_offset, |
| cl_mem col_buffer, const size_t col_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDim2col(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem im_buffer, const size_t im_offset, |
| cl_mem col_buffer, const size_t col_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCim2col(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem im_buffer, const size_t im_offset, |
| cl_mem col_buffer, const size_t col_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZim2col(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem im_buffer, const size_t im_offset, |
| cl_mem col_buffer, const size_t col_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHim2col(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem im_buffer, const size_t im_offset, |
| cl_mem col_buffer, const size_t col_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SCOL2IM/DCOL2IM/CCOL2IM/ZCOL2IM/HCOL2IM: the five declarations differ only in name; here col_buffer is the const argument and im_buffer the non-const one. NOTE(review): presumably the column-to-image transform, i.e. the reverse direction of im2col - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastScol2im(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem col_buffer, const size_t col_offset, |
| cl_mem im_buffer, const size_t im_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDcol2im(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem col_buffer, const size_t col_offset, |
| cl_mem im_buffer, const size_t im_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCcol2im(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem col_buffer, const size_t col_offset, |
| cl_mem im_buffer, const size_t im_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZcol2im(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem col_buffer, const size_t col_offset, |
| cl_mem im_buffer, const size_t im_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHcol2im(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, |
| const cl_mem col_buffer, const size_t col_offset, |
| cl_mem im_buffer, const size_t im_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SCONVGEMM/DCONVGEMM/HCONVGEMM (no C/Z variants are declared in this group): const im_buffer and kernel_buffer, non-const result_buffer, with num_kernels and batch_count among the size arguments. NOTE(review): presumably a batched convolution implemented via GEMM - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSconvgemm(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, const size_t num_kernels, const size_t batch_count, |
| const cl_mem im_buffer, const size_t im_offset, |
| const cl_mem kernel_buffer, const size_t kernel_offset, |
| cl_mem result_buffer, const size_t result_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDconvgemm(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, const size_t num_kernels, const size_t batch_count, |
| const cl_mem im_buffer, const size_t im_offset, |
| const cl_mem kernel_buffer, const size_t kernel_offset, |
| cl_mem result_buffer, const size_t result_offset, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHconvgemm(const CLBlastKernelMode kernel_mode, |
| const size_t channels, const size_t height, const size_t width, const size_t kernel_h, const size_t kernel_w, const size_t pad_h, const size_t pad_w, const size_t stride_h, const size_t stride_w, const size_t dilation_h, const size_t dilation_w, const size_t num_kernels, const size_t batch_count, |
| const cl_mem im_buffer, const size_t im_offset, |
| const cl_mem kernel_buffer, const size_t kernel_offset, |
| cl_mem result_buffer, const size_t result_offset, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SAXPYBATCHED/DAXPYBATCHED/CAXPYBATCHED/ZAXPYBATCHED/HAXPYBATCHED: alphas, x_offsets and y_offsets are pointers rather than scalars and are accompanied by batch_count; y_buffer is the non-const buffer. NOTE(review): presumably each array holds batch_count entries, one per AXPY - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSaxpyBatched(const size_t n, |
| const float *alphas, |
| const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
| cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDaxpyBatched(const size_t n, |
| const double *alphas, |
| const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
| cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCaxpyBatched(const size_t n, |
| const cl_float2 *alphas, |
| const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
| cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZaxpyBatched(const size_t n, |
| const cl_double2 *alphas, |
| const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
| cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHaxpyBatched(const size_t n, |
| const cl_half *alphas, |
| const cl_mem x_buffer, const size_t *x_offsets, const size_t x_inc, |
| cl_mem y_buffer, const size_t *y_offsets, const size_t y_inc, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SGEMMBATCHED/DGEMMBATCHED/CGEMMBATCHED/ZGEMMBATCHED/HGEMMBATCHED: alphas, betas and the a/b/c offsets are passed as pointers together with batch_count; c_buffer is the only non-const cl_mem. NOTE(review): presumably each array holds batch_count entries, one per GEMM - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const float *alphas, |
| const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
| const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
| const float *betas, |
| cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const double *alphas, |
| const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
| const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
| const double *betas, |
| cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_float2 *alphas, |
| const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
| const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
| const cl_float2 *betas, |
| cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_double2 *alphas, |
| const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
| const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
| const cl_double2 *betas, |
| cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHgemmBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_half *alphas, |
| const cl_mem a_buffer, const size_t *a_offsets, const size_t a_ld, |
| const cl_mem b_buffer, const size_t *b_offsets, const size_t b_ld, |
| const cl_half *betas, |
| cl_mem c_buffer, const size_t *c_offsets, const size_t c_ld, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* SGEMMSTRIDEDBATCHED/D/C/Z/H variants: scalar alpha and beta with a single offset per matrix, plus a_stride, b_stride, c_stride and batch_count; c_buffer is the only non-const cl_mem. NOTE(review): presumably matrix i of the batch starts at offset + i * stride - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastDgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastCgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastZgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
| CLBlastStatusCode PUBLIC_API CLBlastHgemmStridedBatched(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, const size_t a_stride, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, const size_t b_stride, |
| const cl_half beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, const size_t c_stride, |
| const size_t batch_count, |
| cl_command_queue* queue, cl_event* event); |
|
|
| /* S/D/C/Z/H GEMM variants that take a caller-supplied cl_mem temp_buffer as the final argument, after queue and event; c_buffer and temp_buffer are the non-const buffers. */ |
| /* NOTE(review): presumably temp_buffer must be at least as large as the value reported by the matching GemmTempBufferSize function declared in this header - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const float alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const float beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
| CLBlastStatusCode PUBLIC_API CLBlastDgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const double alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const double beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
| CLBlastStatusCode PUBLIC_API CLBlastCgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_float2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_float2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
| CLBlastStatusCode PUBLIC_API CLBlastZgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_double2 alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_double2 beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
| CLBlastStatusCode PUBLIC_API CLBlastHgemmWithTempBuffer(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const cl_half alpha, |
| const cl_mem a_buffer, const size_t a_offset, const size_t a_ld, |
| const cl_mem b_buffer, const size_t b_offset, const size_t b_ld, |
| const cl_half beta, |
| cl_mem c_buffer, const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, cl_event* event, cl_mem temp_buffer); |
|
|
| /* S/D/C/Z/H GemmTempBufferSize: take the GEMM layout, transposes, sizes, offsets and leading dimensions plus a queue, but no buffers, scalars or event; temp_buffer_size is a non-const size_t pointer, presumably the output. */ |
| /* NOTE(review): the unit of the value stored in temp_buffer_size (bytes versus elements) is not visible in this header - confirm before allocating. */ |
| CLBlastStatusCode PUBLIC_API CLBlastSGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const size_t a_offset, const size_t a_ld, |
| const size_t b_offset, const size_t b_ld, |
| const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, |
| size_t* temp_buffer_size); |
|
|
| CLBlastStatusCode PUBLIC_API CLBlastDGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const size_t a_offset, const size_t a_ld, |
| const size_t b_offset, const size_t b_ld, |
| const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, |
| size_t* temp_buffer_size); |
|
|
| CLBlastStatusCode PUBLIC_API CLBlastCGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const size_t a_offset, const size_t a_ld, |
| const size_t b_offset, const size_t b_ld, |
| const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, |
| size_t* temp_buffer_size); |
|
|
| CLBlastStatusCode PUBLIC_API CLBlastZGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const size_t a_offset, const size_t a_ld, |
| const size_t b_offset, const size_t b_ld, |
| const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, |
| size_t* temp_buffer_size); |
|
|
| CLBlastStatusCode PUBLIC_API CLBlastHGemmTempBufferSize(const CLBlastLayout layout, const CLBlastTranspose a_transpose, const CLBlastTranspose b_transpose, |
| const size_t m, const size_t n, const size_t k, |
| const size_t a_offset, const size_t a_ld, |
| const size_t b_offset, const size_t b_ld, |
| const size_t c_offset, const size_t c_ld, |
| cl_command_queue* queue, |
| size_t* temp_buffer_size); |
|
|
| |
|
|
| /* Cache-clearing entry point: takes no arguments and returns a CLBlastStatusCode. NOTE(review): what exactly is cached is not visible in this header. */ |
| /* Declared with (void) so C callers get a real prototype; an empty parameter list in C before C23 leaves the arguments unspecified and unchecked. */ |
| CLBlastStatusCode PUBLIC_API CLBlastClearCache(void); |
|
|
| /* Cache-filling entry point: takes the cl_device_id to operate on and returns a CLBlastStatusCode. */ |
| /* NOTE(review): presumably pre-populates the library cache with the kernels for that device - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastFillCache(const cl_device_id device); |
|
|
| |
|
|
| /* Takes a device, a kernel name, a precision and two parallel-looking arrays (parameters_names, parameters_values) described by num_parameters; returns a CLBlastStatusCode. */ |
| /* NOTE(review): presumably both arrays hold num_parameters entries and replace the tuned parameter values for that kernel on that device - confirm. */ |
| CLBlastStatusCode PUBLIC_API CLBlastOverrideParameters(const cl_device_id device, const char* kernel_name, |
| const CLBlastPrecision precision, const size_t num_parameters, |
| const char** parameters_names, const size_t* parameters_values); |
|
|
| |
|
|
| #ifdef __cplusplus |
| } /* closes the extern "C" block opened near the top of this header */ |
| #endif |
|
|
| /* End of include guard CLBLAST_CLBLAST_C_H_ */ |
| #endif |
|
|