control vector api and implementation

2024-03-09 20:22:37 -08:00 · 2024-03-09 20:22:37 -08:00 · 6b90566052
commit 6b90566052
parent 8030da7afe
4 changed files with 364 additions and 0 deletions
--- a/llama.h
+++ b/llama.h
@ -437,6 +437,20 @@ extern "C" {
                      const char * path_base_model,
                         int32_t   n_threads);

+    // Apply a loaded control vector to a llama_context, or if data is NULL, clear
+    // the currently loaded vector.
+    // n_embd should be the size of a single layer's control, and data should point
+    // to an n_embd x n_layers buffer starting from layer 1.
+    // il_start and il_end are the layer range the vector should apply to (both inclusive)
+    // See llama_control_vector_load in common to load a control vector.
+    LLAMA_API int32_t llama_control_vector_apply(
+            struct llama_context * lctx,
+                           float * data,
+                          size_t   len,
+                             int   n_embd,
+                         int32_t   il_start,
+                         int32_t   il_end);
+
    //
    // KV cache
    //