wip dont use

Concedo 2023-04-21 00:35:54 +08:00
parent 7ba36c2c6c
commit 07bb31b034
42 changed files with 8 additions and 7 deletions


@@ -1,4 +1,4 @@
-default: koboldcpp koboldcpp_noavx2 koboldcpp_openblas koboldcpp_openblas_noavx2 koboldcpp_clblast
+default: koboldcpp koboldcpp_noavx2 koboldcpp_openblas koboldcpp_openblas_noavx2 koboldcpp_clblast koboldcpp_cublas
 simple: koboldcpp koboldcpp_noavx2
 dev: koboldcpp_openblas
@@ -45,8 +45,8 @@ endif
 #
 # keep standard at C11 and C++11
-CFLAGS = -I. -Ofast -DNDEBUG -std=c11 -fPIC
-CXXFLAGS = -I. -I./examples -Ofast -DNDEBUG -std=c++11 -fPIC
+CFLAGS = -I. -I./include -I./include/CL -Ofast -DNDEBUG -std=c11 -fPIC
+CXXFLAGS = -I. -I./examples -I./include -I./include/CL -Ofast -DNDEBUG -std=c++11 -fPIC
 LDFLAGS =
 # these are used on windows, to build some libraries with extra old device compatibility
@@ -55,7 +55,7 @@ BONUSCFLAGS2 =
 OPENBLAS_FLAGS = -DGGML_USE_OPENBLAS -I/usr/local/include/openblas
 CLBLAST_FLAGS = -DGGML_USE_CLBLAST -DGGML_USE_OPENBLAS -I/usr/local/include/openblas
-CUBLAS_FLAGS = -DGGML_USE_CUBLAS -I/usr/local/cuda/include
+CUBLAS_FLAGS = -DGGML_USE_CUBLAS -I/usr/local/cuda/include -I./include/cuda -I./include/cuda/crt
 #lets try enabling everything
 CFLAGS += -pthread -s
@@ -251,7 +251,7 @@ gpttype_adapter.o: gpttype_adapter.cpp
 	$(CXX) $(CXXFLAGS) -c $< -o $@
 clean:
-	rm -vf *.o main quantize_llama quantize_gpt2 quantize_gptj quantize-stats perplexity embedding benchmark-q4_0-matmult main.exe quantize_llama.exe quantize_gptj.exe quantize_gpt2.exe koboldcpp.dll koboldcpp_openblas.dll koboldcpp_noavx2.dll koboldcpp_openblas_noavx2.dll koboldcpp_clblast.dll koboldcpp.so koboldcpp_openblas.so koboldcpp_noavx2.so koboldcpp_openblas_noavx2.so koboldcpp_clblast.so gptj.exe gpt2.exe
+	rm -vf *.o main quantize_llama quantize_gpt2 quantize_gptj quantize-stats perplexity embedding benchmark-q4_0-matmult main.exe quantize_llama.exe quantize_gptj.exe quantize_gpt2.exe koboldcpp.dll koboldcpp_openblas.dll koboldcpp_noavx2.dll koboldcpp_openblas_noavx2.dll koboldcpp_clblast.dll koboldcpp_cublas.dll koboldcpp.so koboldcpp_openblas.so koboldcpp_noavx2.so koboldcpp_openblas_noavx2.so koboldcpp_clblast.so koboldcpp_cublas.so gptj.exe gpt2.exe
 main: examples/main/main.cpp ggml.o llama.o common.o $(OBJS)
 	$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
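
The Makefile hunks above add a `koboldcpp_cublas` target to the default build, vendored `./include` paths, and CUDA include directories to `CUBLAS_FLAGS`. As a rough usage sketch (assuming the `koboldcpp_cublas` rule itself is defined in a part of the Makefile not shown in this excerpt, and that the CUDA toolkit lives under `/usr/local/cuda` as the `-I` path suggests):

```sh
# Build only the new CUDA-enabled library target (the rule is assumed to
# exist elsewhere in the Makefile; only its name appears in this excerpt)
make koboldcpp_cublas

# Or build everything, since the default target list now includes it
make
```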


@@ -36,7 +36,8 @@ What does it mean? You get llama.cpp with a fancy UI, persistent stories, editin
 - You will have to compile your binaries from source. A makefile is provided, simply run `make`
 - If you want you can also link your own install of OpenBLAS manually with `make LLAMA_OPENBLAS=1`
 - Alternatively, if you want you can also link your own install of CLBlast manually with `make LLAMA_CLBLAST=1`, for this you will need to obtain and link OpenCL and CLBlast libraries.
-- For Arch Linux: Install `cblas` and `openblas`. In the makefile, find the `ifdef LLAMA_OPENBLAS` conditional and add `-lcblas` to `LDFLAGS`.
+- For a full featured build, do `make LLAMA_OPENBLAS=1 LLAMA_CLBLAST=1`
+- For Arch Linux: Install `cblas` and `openblas`.
+- For Debian: Install `libclblast-dev` and `libopenblas-dev`.
 - After all binaries are built, you can run the python script with the command `koboldcpp.py [ggml_model.bin] [port]`
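
Taken together, the updated README steps amount to something like the following (the model filename and port below are placeholders for illustration, not values taken from the diff):

```sh
# Full-featured build as described in the updated README
make LLAMA_OPENBLAS=1 LLAMA_CLBLAST=1

# Run the Python frontend against a model; substitute your own model path and port
python koboldcpp.py ggml-model.bin 5001
```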


@@ -4,7 +4,7 @@
 #define CBLAS_H
 #include <stddef.h>
-#include "openblas_config.h"
+#include <openblas_config.h>
 #ifdef __cplusplus
 extern "C" {