|
// CUDA -> HIP compatibility aliases: each macro below rewrites a CUDA runtime
// or cuBLAS identifier to the HIP / hipBLAS identifier on its right-hand side.
// NOTE(review): the conditional that guards this group opens above the visible
// region -- confirm which build flag selects it.
6 | 6 | #define CUBLAS_OP_N HIPBLAS_OP_N |
7 | 7 | #define CUBLAS_OP_T HIPBLAS_OP_T |
8 | 8 | #define CUBLAS_STATUS_SUCCESS HIPBLAS_STATUS_SUCCESS |
// Not an alias: the math-mode constant is given the literal value 0.
// NOTE(review): presumably a placeholder because its only visible consumer,
// cublasSetMathMode below, ignores its arguments -- confirm no other use.
| 9 | +#define CUBLAS_TF32_TENSOR_OP_MATH 0 |
9 | 10 | #define cublasCreate hipblasCreate |
10 | 11 | #define cublasGemmEx hipblasGemmEx |
11 | 12 | #define cublasHandle_t hipblasHandle_t |
// Function-like stub: both arguments are discarded (never evaluated) and the
// call site expands to HIPBLAS_STATUS_SUCCESS, the same constant that
// CUBLAS_STATUS_SUCCESS is mapped to above, so status checks on it pass.
| 13 | +#define cublasSetMathMode(h, m) HIPBLAS_STATUS_SUCCESS |
12 | 14 | #define cublasSetStream hipblasSetStream |
13 | 15 | #define cublasSgemm hipblasSgemm |
14 | 16 | #define cublasStatus_t hipblasStatus_t |
15 | 17 | #define CUDA_R_16F HIPBLAS_R_16F |
16 | 18 | #define CUDA_R_32F HIPBLAS_R_32F |
// Runtime API aliases: device sync, error type, events, memory, streams.
| 19 | +#define cudaDeviceSynchronize hipDeviceSynchronize |
17 | 20 | #define cudaError_t hipError_t |
| 21 | +#define cudaEvent_t hipEvent_t |
| 22 | +#define cudaEventCreateWithFlags hipEventCreateWithFlags |
| 23 | +#define cudaEventDisableTiming hipEventDisableTiming |
| 24 | +#define cudaEventRecord hipEventRecord |
18 | 25 | #define cudaFree hipFree |
| 26 | +#define cudaFreeHost hipFreeHost |
19 | 27 | #define cudaGetErrorString hipGetErrorString |
20 | 28 | #define cudaGetLastError hipGetLastError |
21 | 29 | #define cudaMalloc hipMalloc |
| 30 | +#define cudaMallocHost hipMallocHost |
22 | 31 | #define cudaMemcpyAsync hipMemcpyAsync |
23 | 32 | #define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost |
24 | 33 | #define cudaMemcpyHostToDevice hipMemcpyHostToDevice |
25 | 34 | #define cudaStream_t hipStream_t |
26 | 35 | #define cudaStreamCreateWithFlags hipStreamCreateWithFlags |
27 | 36 | #define cudaStreamNonBlocking hipStreamNonBlocking |
28 | 37 | #define cudaStreamSynchronize hipStreamSynchronize |
| 38 | +#define cudaStreamWaitEvent hipStreamWaitEvent |
29 | 39 | #define cudaSuccess hipSuccess |
// Defined with no value, so it is only usable as an #ifdef / defined() flag.
// NOTE(review): presumably enables the CUDA-named code paths for this
// backend -- confirm against the code that tests it.
30 | 40 | #define GGML_USE_CUBLAS |
31 | 41 | #else |
|
0 commit comments