Add more CUDA defines
This is needed so that 'slaren/cuda-f16f32' can be merged.
This commit is contained in:
parent
ecc056519f
commit
a1caa48611
1 changed file with 10 additions and 0 deletions
10
ggml-cuda.h
10
ggml-cuda.h
|
@@ -6,19 +6,28 @@
|
||||||
#define CUBLAS_OP_N HIPBLAS_OP_N
|
#define CUBLAS_OP_N HIPBLAS_OP_N
|
||||||
#define CUBLAS_OP_T HIPBLAS_OP_T
|
#define CUBLAS_OP_T HIPBLAS_OP_T
|
||||||
#define CUBLAS_STATUS_SUCCESS HIPBLAS_STATUS_SUCCESS
|
#define CUBLAS_STATUS_SUCCESS HIPBLAS_STATUS_SUCCESS
|
||||||
|
#define CUBLAS_TF32_TENSOR_OP_MATH 0
|
||||||
#define cublasCreate hipblasCreate
|
#define cublasCreate hipblasCreate
|
||||||
#define cublasGemmEx hipblasGemmEx
|
#define cublasGemmEx hipblasGemmEx
|
||||||
#define cublasHandle_t hipblasHandle_t
|
#define cublasHandle_t hipblasHandle_t
|
||||||
|
#define cublasSetMathMode(h, m) HIPBLAS_STATUS_SUCCESS
|
||||||
#define cublasSetStream hipblasSetStream
|
#define cublasSetStream hipblasSetStream
|
||||||
#define cublasSgemm hipblasSgemm
|
#define cublasSgemm hipblasSgemm
|
||||||
#define cublasStatus_t hipblasStatus_t
|
#define cublasStatus_t hipblasStatus_t
|
||||||
#define CUDA_R_16F HIPBLAS_R_16F
|
#define CUDA_R_16F HIPBLAS_R_16F
|
||||||
#define CUDA_R_32F HIPBLAS_R_32F
|
#define CUDA_R_32F HIPBLAS_R_32F
|
||||||
|
#define cudaDeviceSynchronize hipDeviceSynchronize
|
||||||
#define cudaError_t hipError_t
|
#define cudaError_t hipError_t
|
||||||
|
#define cudaEvent_t hipEvent_t
|
||||||
|
#define cudaEventCreateWithFlags hipEventCreateWithFlags
|
||||||
|
#define cudaEventDisableTiming hipEventDisableTiming
|
||||||
|
#define cudaEventRecord hipEventRecord
|
||||||
#define cudaFree hipFree
|
#define cudaFree hipFree
|
||||||
|
#define cudaFreeHost hipFreeHost
|
||||||
#define cudaGetErrorString hipGetErrorString
|
#define cudaGetErrorString hipGetErrorString
|
||||||
#define cudaGetLastError hipGetLastError
|
#define cudaGetLastError hipGetLastError
|
||||||
#define cudaMalloc hipMalloc
|
#define cudaMalloc hipMalloc
|
||||||
|
#define cudaMallocHost hipMallocHost
|
||||||
#define cudaMemcpyAsync hipMemcpyAsync
|
#define cudaMemcpyAsync hipMemcpyAsync
|
||||||
#define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost
|
#define cudaMemcpyDeviceToHost hipMemcpyDeviceToHost
|
||||||
#define cudaMemcpyHostToDevice hipMemcpyHostToDevice
|
#define cudaMemcpyHostToDevice hipMemcpyHostToDevice
|
||||||
|
@@ -26,6 +35,7 @@
|
||||||
#define cudaStreamCreateWithFlags hipStreamCreateWithFlags
|
#define cudaStreamCreateWithFlags hipStreamCreateWithFlags
|
||||||
#define cudaStreamNonBlocking hipStreamNonBlocking
|
#define cudaStreamNonBlocking hipStreamNonBlocking
|
||||||
#define cudaStreamSynchronize hipStreamSynchronize
|
#define cudaStreamSynchronize hipStreamSynchronize
|
||||||
|
#define cudaStreamWaitEvent hipStreamWaitEvent
|
||||||
#define cudaSuccess hipSuccess
|
#define cudaSuccess hipSuccess
|
||||||
#define GGML_USE_CUBLAS
|
#define GGML_USE_CUBLAS
|
||||||
#else
|
#else
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue