llama : clean-up

2024-07-23 08:38:50 +03:00 · 2024-07-23 08:38:50 +03:00 · fe28a7b9d8
commit fe28a7b9d8
parent dae3cae841
5 changed files with 20 additions and 29 deletions
--- a/src/llama-impl.h
+++ b/src/llama-impl.h
@@ -3,24 +3,6 @@
 #define LLAMA_API_INTERNAL
 #include "llama.h"
 #ifdef __has_include
    #if __has_include(<unistd.h>)
        #include <unistd.h>
        #if defined(_POSIX_MAPPED_FILES)
            #include <sys/mman.h>
            #include <fcntl.h>
        #endif
        #if defined(_POSIX_MEMLOCK_RANGE)
            #include <sys/resource.h>
        #endif
    #endif
 #endif
 // bump if necessary
 // NOTE(review): presumably compile-time upper limits sized for the largest supported
 // model (the 160 is attributed to DeepSeekV2) — their uses are not visible here, confirm
 #define LLAMA_MAX_NODES   8192
 #define LLAMA_MAX_LAYERS  512
 #define LLAMA_MAX_EXPERTS 160  // DeepSeekV2
 #ifdef __GNUC__
 #ifdef __MINGW32__
 #define LLAMA_ATTRIBUTE_FORMAT(...) __attribute__((format(gnu_printf, __VA_ARGS__)))
--- a/src/llama-sampling.h
+++ b/src/llama-sampling.h
@@ -18,8 +18,6 @@ struct llama_sampling {
    }
 };
 // Returns the address of the `sampling` member held inside ctx (&ctx->sampling).
 struct llama_sampling * llama_get_sampling(struct llama_context * ctx);
 //
 // internal API
 //
--- a/src/llama-vocab.h
+++ b/src/llama-vocab.h
@@ -62,7 +62,6 @@ struct llama_vocab {
 };
 // Vocabulary accessors: the context overload returns &ctx->model.vocab,
 // the model overload returns &model->vocab. Both hand out a pointer to const.
 const struct llama_vocab * llama_get_vocab(const struct llama_context * ctx);
 const struct llama_vocab * llama_get_vocab(const struct llama_model   * model);
 //
 // internal API
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -36,6 +36,19 @@
 // TODO: replace with ggml API call
 #define QK_K 256
 #ifdef __has_include
    #if __has_include(<unistd.h>)
        #include <unistd.h>
        #if defined(_POSIX_MAPPED_FILES)
            #include <sys/mman.h>
            #include <fcntl.h>
        #endif
        #if defined(_POSIX_MEMLOCK_RANGE)
            #include <sys/resource.h>
        #endif
    #endif
 #endif
 #if defined(_WIN32)
    #define WIN32_LEAN_AND_MEAN
    #ifndef NOMINMAX
@@ -87,6 +100,11 @@
 #pragma warning(disable: 4244 4267) // possible loss of data
 #endif
 // bump if necessary
 // NOTE(review): presumably compile-time upper limits sized for the largest supported
 // model (the 160 is attributed to DeepSeekV2) — their uses are not visible here, confirm
 #define LLAMA_MAX_NODES   8192
 #define LLAMA_MAX_LAYERS  512
 #define LLAMA_MAX_EXPERTS 160  // DeepSeekV2
 //
 // helpers
 //
@@ -16794,14 +16812,6 @@ const struct llama_vocab * llama_get_vocab(const struct llama_context * ctx) {
    return &ctx->model.vocab;
 }
 // Model overload: hands out a read-only pointer to the vocabulary stored in the model.
 const struct llama_vocab * llama_get_vocab(const struct llama_model * model) {
    const struct llama_vocab * vocab = &model->vocab;
    return vocab;
 }
 // Exposes the `sampling` member of the context; the caller receives a mutable pointer into ctx.
 struct llama_sampling * llama_get_sampling(struct llama_context * ctx) {
    struct llama_sampling * sampling = &ctx->sampling;
    return sampling;
 }
 // Exposes the `grammar` member of the context; the caller receives a mutable pointer into ctx.
 struct llama_grammar * llama_get_grammar(struct llama_context * ctx) {
    struct llama_grammar * grammar = &ctx->grammar;
    return grammar;
 }
--- a/src/unicode.h
+++ b/src/unicode.h
@@ -4,6 +4,8 @@
 #include <string>
 #include <vector>
 // TODO: prefix all symbols with "llama_"
 struct codepoint_flags {
    enum {
        UNDEFINED       = 0x0001,