diff --git a/common/common.h b/common/common.h
index e64292152..0d452cf0f 100644
--- a/common/common.h
+++ b/common/common.h
@@ -24,7 +24,6 @@
 
 #define DEFAULT_MODEL_PATH "models/7B/ggml-model-f16.gguf"
 
-// TODO: "lora_adapter" is tautology
 struct common_lora_adapter_info {
     std::string path;
     float scale;
diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index 441c58e38..c2e62ba69 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -1626,6 +1626,7 @@ struct server_response {
 struct server_context {
     common_params params_base;
 
+    // note: keep these alive - they determine the lifetime of the model, context, etc.
     common_init_result llama_init;
     common_init_result llama_init_dft;
 
diff --git a/src/llama-sampling.cpp b/src/llama-sampling.cpp
index 86a76f71d..69cea2f14 100644
--- a/src/llama-sampling.cpp
+++ b/src/llama-sampling.cpp
@@ -124,6 +124,7 @@ struct ring_buffer {
     size_t sz = 0;
     size_t first = 0;
     size_t pos = 0;
+
     std::vector<T> data;
 };
 