Introduce C-style API (#370)

* Major refactoring - introduce C-style API * Clean up * Add <cassert> * Add <iterator> * Add <algorithm> .... * Fix timing reporting and accumulation * Measure eval time only for single-token calls * Change llama_tokenize return meaning
2023-03-22 07:32:36 +02:00 · 2023-03-22 07:32:36 +02:00 · f5a77a629b
commit f5a77a629b
parent da0e9fe90c
14 changed files with 1954 additions and 1752 deletions
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@ -207,15 +207,10 @@ else()
    message(STATUS "Unknown architecture")
 endif()

-
 #
-# Build library
+# Build libraries
 #

-add_executable(llama main.cpp)
-
-add_executable(quantize quantize.cpp)
-
 add_library(utils OBJECT
            utils.cpp
            utils.h)
@ -229,14 +224,24 @@ add_library(ggml OBJECT

 target_include_directories(ggml PUBLIC .)
 target_compile_features(ggml PUBLIC c_std_11) # don't bump
-
-#
-# Linking
-#
-
 target_link_libraries(ggml PRIVATE Threads::Threads ${LLAMA_EXTRA_LIBS})
-target_link_libraries(llama PRIVATE ggml utils)
-target_link_libraries(quantize PRIVATE ggml utils)
+
+add_library(llama OBJECT
+            llama.cpp
+            llama.h)
+
+target_include_directories(llama PUBLIC .)
+target_compile_features(llama PUBLIC cxx_std_11) # don't bump
+
+#
+# Executables
+#
+
+add_executable(main main.cpp)
+target_link_libraries(main PRIVATE llama ggml utils)
+
+add_executable(quantize quantize.cpp)
+target_link_libraries(quantize PRIVATE llama ggml utils)

 #
 # programs, examples and tests