try MUSA fix
This commit is contained in:
parent
ab20aa99c2
commit
6a5cdad219
1 changed file with 3 additions and 0 deletions
3
ggml/src/ggml-cuda/vendors/musa.h
vendored
3
ggml/src/ggml-cuda/vendors/musa.h
vendored
|
@@ -3,6 +3,7 @@
|
||||||
#include <musa_runtime.h>
|
#include <musa_runtime.h>
|
||||||
#include <musa.h>
|
#include <musa.h>
|
||||||
#include <mublas.h>
|
#include <mublas.h>
|
||||||
|
#include <musa_bf16.h>
|
||||||
#include <musa_fp16.h>
|
#include <musa_fp16.h>
|
||||||
#define CUBLAS_COMPUTE_16F CUDA_R_16F
|
#define CUBLAS_COMPUTE_16F CUDA_R_16F
|
||||||
#define CUBLAS_COMPUTE_32F CUDA_R_32F
|
#define CUBLAS_COMPUTE_32F CUDA_R_32F
|
||||||
|
@@ -132,3 +133,5 @@
|
||||||
#define cudaKernelNodeParams musaKernelNodeParams
|
#define cudaKernelNodeParams musaKernelNodeParams
|
||||||
#define cudaStreamCaptureModeRelaxed musaStreamCaptureModeRelaxed
|
#define cudaStreamCaptureModeRelaxed musaStreamCaptureModeRelaxed
|
||||||
#define cudaStreamEndCapture musaStreamEndCapture
|
#define cudaStreamEndCapture musaStreamEndCapture
|
||||||
|
|
||||||
|
typedef musa_bfloat16 nv_bfloat16;
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue