|
6 | 6 | #define CUBLAS_OP_N HIPBLAS_OP_N
|
7 | 7 | #define CUBLAS_OP_T HIPBLAS_OP_T
|
8 | 8 | #define CUBLAS_STATUS_SUCCESS HIPBLAS_STATUS_SUCCESS
|
| 9 | +#define CUBLAS_TF32_TENSOR_OP_MATH 0 |
9 | 10 | #define cublasCreate hipblasCreate
|
10 | 11 | #define cublasGemmEx hipblasGemmEx
|
11 | 12 | #define cublasHandle_t hipblasHandle_t
|
| 13 | +#define cublasSetMathMode(h, m) HIPBLAS_STATUS_SUCCESS |
12 | 14 | #define cublasSetStream hipblasSetStream
|
13 | 15 | #define cublasSgemm hipblasSgemm
|
14 | 16 | #define cublasStatus_t hipblasStatus_t
|
15 | 17 | #define CUDA_R_16F HIPBLAS_R_16F
|
16 | 18 | #define CUDA_R_32F HIPBLAS_R_32F
|
| 19 | +#define cudaDeviceSynchronize hipDeviceSynchronize |
17 | 20 | #define cudaError_t hipError_t
|
| 21 | +#define cudaEvent_t hipEvent_t |
| 22 | +#define cudaEventCreateWithFlags hipEventCreateWithFlags |
| 23 | +#define cudaEventDisableTiming hipEventDisableTiming |
| 24 | +#define cudaEventRecord hipEventRecord |
18 | 25 | #define cudaFree hipFree
|
| 26 | +#define cudaFreeHost hipFreeHost |
19 | 27 | #define cudaGetErrorString hipGetErrorString
|
20 | 28 | #define cudaGetLastError hipGetLastError
|
21 | 29 | #define cudaMalloc hipMalloc
|
| 30 | +#define cudaMallocHost hipMallocHost |
22 | 31 | #define cudaMemcpyAsync hipMemcpyAsync
|
23 | 32 | #define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost
|
24 | 33 | #define cudaMemcpyHostToDevice hipMemcpyHostToDevice
|
25 | 34 | #define cudaStream_t hipStream_t
|
26 | 35 | #define cudaStreamCreateWithFlags hipStreamCreateWithFlags
|
27 | 36 | #define cudaStreamNonBlocking hipStreamNonBlocking
|
28 | 37 | #define cudaStreamSynchronize hipStreamSynchronize
|
| 38 | +#define cudaStreamWaitEvent hipStreamWaitEvent |
29 | 39 | #define cudaSuccess hipSuccess
|
30 | 40 | #define GGML_USE_CUBLAS
|
31 | 41 | #else
|
|
0 commit comments