ggml : update get_rows f16 and q
This commit is contained in:
parent
ac3f7d8e23
commit
2e4db48291
2 changed files with 26 additions and 18 deletions
5
Makefile
5
Makefile
|
@ -396,6 +396,11 @@ ifdef LLAMA_CUBLAS
|
|||
MK_LDFLAGS += -lcublas -lculibos -lcudart -lcublasLt -lpthread -ldl -lrt -L/usr/local/cuda/lib64 -L/opt/cuda/lib64 -L$(CUDA_PATH)/targets/x86_64-linux/lib
|
||||
OBJS += ggml-cuda.o
|
||||
NVCCFLAGS = --forward-unknown-to-host-compiler -use_fast_math
|
||||
|
||||
ifdef LLAMA_DEBUG
|
||||
NVCCFLAGS += -lineinfo
|
||||
endif
|
||||
|
||||
ifdef LLAMA_CUDA_NVCC
|
||||
NVCC = $(LLAMA_CUDA_NVCC)
|
||||
else
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue