NOTE(review): `half` is not a standard C/C++ type; confirm that a header
declaring it is included ahead of this typedef in every translation unit
that is built with GGML_CUDA_F16 defined.

diff --git a/ggml.h b/ggml.h
index bdbd12800..413bc1de5 100644
--- a/ggml.h
+++ b/ggml.h
@@ -255,9 +255,11 @@
 extern "C" {
 #endif
 
-#ifdef __ARM_NEON
+#if defined(__ARM_NEON) && !defined(GGML_CUDA_F16)
     // we use the built-in 16-bit float type
     typedef __fp16 ggml_fp16_t;
+#elif defined(GGML_CUDA_F16)
+    typedef half ggml_fp16_t;
 #else
     typedef uint16_t ggml_fp16_t;
 #endif