Revert CUDA changes as they are buggy
This commit is contained in:
parent
f8376c7e61
commit
a07e6dd3ad
3 changed files with 392 additions and 681 deletions
5
Makefile
5
Makefile
|
@ -176,6 +176,11 @@ ifdef LLAMA_CUDA_KQUANTS_ITER
|
|||
else
|
||||
NVCCFLAGS += -DK_QUANTS_PER_ITERATION=2
|
||||
endif
|
||||
ifdef LLAMA_CUDA_MMQ_Y
|
||||
NVCCFLAGS += -DGGML_CUDA_MMQ_Y=$(LLAMA_CUDA_MMQ_Y)
|
||||
else
|
||||
NVCCFLAGS += -DGGML_CUDA_MMQ_Y=64
|
||||
endif # LLAMA_CUDA_MMQ_Y
|
||||
#ifdef LLAMA_CUDA_CUBLAS
|
||||
# NVCCFLAGS += -DGGML_CUDA_CUBLAS
|
||||
#endif # LLAMA_CUDA_CUBLAS
|
||||
|
|
1066
ggml-cuda.cu
1066
ggml-cuda.cu
File diff suppressed because it is too large
Load diff
|
@ -154,9 +154,11 @@ typedef double ggml_v1_float;
|
|||
#undef bool
|
||||
#define bool _Bool
|
||||
#else
|
||||
#if !defined(__riscv)
|
||||
#include <immintrin.h>
|
||||
#endif
|
||||
#endif
|
||||
#endif
|
||||
|
||||
#ifdef __F16C__
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue