diff --git a/ggml-cuda.cu b/ggml-cuda.cu index 4c37f4278..7873f4f6b 100644 --- a/ggml-cuda.cu +++ b/ggml-cuda.cu @@ -206,7 +206,8 @@ static __global__ void dequantize_block_q8_0(const void * vx, float * y) { } } -template static __global__ void dequantize_mul_mat_vec(const void * vx, const float * y, float * dst, const int ncols) { +template +static __global__ void dequantize_mul_mat_vec(const void * vx, const float * y, float * dst, const int ncols) { const int row = blockIdx.x; const int tid = threadIdx.x;