forked from JuliaGPU/oneAPI.jl
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathonemkl.h
More file actions
82 lines (72 loc) · 3.82 KB
/
onemkl.h
File metadata and controls
82 lines (72 loc) · 3.82 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
#pragma once
#include "sycl.h"
#include <stddef.h>
#include <stdint.h>
#ifdef __cplusplus
extern "C" {
#endif
/*
 * Transpose selector used for the transA / transB parameters of the
 * onemkl?gemm functions declared in this header.
 *
 * The enumerators keep their implicit values (NONTRANS = 0, TRANS = 1,
 * CONJTRANS = 2).
 * NOTE(review): how these map onto the oneMKL transpose values is decided by
 * the implementation, which is not visible from this header.
 */
typedef enum {
    ONEMKL_TRANSPOSE_NONTRANS,
    ONEMKL_TRANSPOSE_TRANS,
    ONEMKL_TRANSPOSE_CONJTRANS,
    /* Original misspelling ("ONEMLK"); kept as an alias with the same value
     * so that existing callers keep compiling. Prefer the name above. */
    ONEMLK_TRANSPOSE_CONJTRANS = ONEMKL_TRANSPOSE_CONJTRANS
} onemklTranspose;
// XXX: the half-precision gemm below is left commented out because it is
// unclear how to expose a half type in C.
// int onemklHgemm(syclQueue_t device_queue, onemklTranspose transA,
// onemklTranspose transB, int64_t m, int64_t n, int64_t k,
// half alpha, const half *A, int64_t lda, const half *B,
// int64_t ldb, half beta, half *C, int64_t ldc);
/*
 * gemm entry points, one per element type. The letter after "onemkl" selects
 * the type used for alpha, beta, A, B and C:
 *   S = float, D = double, C = float _Complex, Z = double _Complex.
 *
 * All four share the same argument list:
 *   device_queue   syclQueue_t handle (type declared in sycl.h)
 *   transA/transB  onemklTranspose selector for A and B respectively
 *   m, n, k        64-bit dimensions
 *   alpha, beta    scalars, passed by value
 *   A, B           read-only (const) input pointers
 *   C              writable pointer
 *   lda, ldb, ldc  64-bit values paired with A, B, C (leading dimensions, by
 *                  BLAS naming convention)
 *
 * NOTE(review): presumably computes C = alpha*op(A)*op(B) + beta*C through
 * oneMKL; the meaning of the int return value is not visible from this
 * header -- confirm against the implementation.
 */
int onemklSgemm(syclQueue_t device_queue,
                onemklTranspose transA, onemklTranspose transB,
                int64_t m, int64_t n, int64_t k,
                float alpha,
                const float *A, int64_t lda,
                const float *B, int64_t ldb,
                float beta,
                float *C, int64_t ldc);

int onemklDgemm(syclQueue_t device_queue,
                onemklTranspose transA, onemklTranspose transB,
                int64_t m, int64_t n, int64_t k,
                double alpha,
                const double *A, int64_t lda,
                const double *B, int64_t ldb,
                double beta,
                double *C, int64_t ldc);

int onemklCgemm(syclQueue_t device_queue,
                onemklTranspose transA, onemklTranspose transB,
                int64_t m, int64_t n, int64_t k,
                float _Complex alpha,
                const float _Complex *A, int64_t lda,
                const float _Complex *B, int64_t ldb,
                float _Complex beta,
                float _Complex *C, int64_t ldc);

int onemklZgemm(syclQueue_t device_queue,
                onemklTranspose transA, onemklTranspose transB,
                int64_t m, int64_t n, int64_t k,
                double _Complex alpha,
                const double _Complex *A, int64_t lda,
                const double _Complex *B, int64_t ldb,
                double _Complex beta,
                double _Complex *C, int64_t ldc);
/*
 * Supported Level-1: nrm2, one entry point per element type
 * (S = float, D = double, C = float _Complex, Z = double _Complex).
 *
 *   device_queue  syclQueue_t handle (type declared in sycl.h)
 *   n             64-bit element count
 *   x             read-only (const) input vector
 *   incx          64-bit increment paired with x (element stride, by BLAS
 *                 naming convention)
 *   result        output pointer; always a real type -- float for S and C,
 *                 double for D and Z
 *
 * NOTE(review): presumably the Euclidean norm of x as computed by oneMKL;
 * confirm against the implementation.
 */
void onemklSnrm2(syclQueue_t device_queue, int64_t n,
                 const float *x, int64_t incx,
                 float *result);

void onemklDnrm2(syclQueue_t device_queue, int64_t n,
                 const double *x, int64_t incx,
                 double *result);

void onemklCnrm2(syclQueue_t device_queue, int64_t n,
                 const float _Complex *x, int64_t incx,
                 float *result);

void onemklZnrm2(syclQueue_t device_queue, int64_t n,
                 const double _Complex *x, int64_t incx,
                 double *result);
/*
 * copy entry points, one per element type
 * (S = float, D = double, C = float _Complex, Z = double _Complex).
 *
 *   device_queue  syclQueue_t handle (type declared in sycl.h)
 *   n             64-bit element count
 *   x, incx       read-only (const) source vector and its 64-bit increment
 *   y, incy       writable destination vector and its 64-bit increment
 *
 * NOTE(review): presumably copies n elements of x into y with BLAS copy
 * semantics; confirm against the implementation.
 */
void onemklScopy(syclQueue_t device_queue, int64_t n,
                 const float *x, int64_t incx,
                 float *y, int64_t incy);

void onemklDcopy(syclQueue_t device_queue, int64_t n,
                 const double *x, int64_t incx,
                 double *y, int64_t incy);

void onemklCcopy(syclQueue_t device_queue, int64_t n,
                 const float _Complex *x, int64_t incx,
                 float _Complex *y, int64_t incy);

void onemklZcopy(syclQueue_t device_queue, int64_t n,
                 const double _Complex *x, int64_t incx,
                 double _Complex *y, int64_t incy);
/*
 * amax entry points, one per element type
 * (S = float, D = double, C = float _Complex, Z = double _Complex).
 *
 *   device_queue  syclQueue_t handle (type declared in sycl.h)
 *   n             64-bit element count
 *   x, incx       read-only (const) input vector and its 64-bit increment
 *   result        output pointer to a 64-bit integer, for every element type
 *
 * NOTE(review): presumably stores the index of the element of x with the
 * largest absolute value (BLAS iamax); whether the index is 0- or 1-based is
 * not visible from this header -- confirm against the implementation.
 */
void onemklSamax(syclQueue_t device_queue, int64_t n,
                 const float *x, int64_t incx,
                 int64_t *result);

void onemklDamax(syclQueue_t device_queue, int64_t n,
                 const double *x, int64_t incx,
                 int64_t *result);

void onemklCamax(syclQueue_t device_queue, int64_t n,
                 const float _Complex *x, int64_t incx,
                 int64_t *result);

void onemklZamax(syclQueue_t device_queue, int64_t n,
                 const double _Complex *x, int64_t incx,
                 int64_t *result);
/*
 * amin entry points, one per element type
 * (S = float, D = double, C = float _Complex, Z = double _Complex).
 *
 *   device_queue  syclQueue_t handle (type declared in sycl.h)
 *   n             64-bit element count
 *   x, incx       read-only (const) input vector and its 64-bit increment
 *   result        output pointer to a 64-bit integer, for every element type
 *
 * NOTE(review): presumably stores the index of the element of x with the
 * smallest absolute value (BLAS iamin); whether the index is 0- or 1-based is
 * not visible from this header -- confirm against the implementation.
 */
void onemklSamin(syclQueue_t device_queue, int64_t n,
                 const float *x, int64_t incx,
                 int64_t *result);

void onemklDamin(syclQueue_t device_queue, int64_t n,
                 const double *x, int64_t incx,
                 int64_t *result);

void onemklCamin(syclQueue_t device_queue, int64_t n,
                 const float _Complex *x, int64_t incx,
                 int64_t *result);

void onemklZamin(syclQueue_t device_queue, int64_t n,
                 const double _Complex *x, int64_t incx,
                 int64_t *result);
/*
 * Takes no arguments and returns nothing.
 *
 * Declared with an explicit (void) parameter list: in C (before C23) an empty
 * "()" declares a function with unspecified parameters, so calls passing
 * arguments would not be diagnosed. In C++ both spellings mean the same.
 *
 * NOTE(review): presumably tears down state held by the wrapper library; what
 * exactly is released is not visible from this header -- confirm against the
 * implementation.
 */
void onemklDestroy(void);
#ifdef __cplusplus
}
#endif