llama-bench : add model sizes (#2771)

* llama-bench : add model sizes
* more compact markdown output
* back to GiB
* adjust column sizes
2023-08-25 15:16:19 +02:00 · 2023-08-25 15:16:19 +02:00 · 154725c543
commit 154725c543
parent 12e2e33a97
3 changed files with 74 additions and 10 deletions
--- a/llama.h
+++ b/llama.h
@@ -254,7 +254,11 @@ extern "C" {
    LLAMA_API int llama_model_n_embd (const struct llama_model * model);

    // Get a string describing the model type
-    LLAMA_API int llama_model_type(const struct llama_model * model, char * buf, size_t buf_size);
+    LLAMA_API int llama_model_desc(const struct llama_model * model, char * buf, size_t buf_size);
+    // Returns the total size of all the tensors in the model in bytes
+    LLAMA_API uint64_t llama_model_size(const struct llama_model * model);
+    // Returns the total number of parameters in the model
+    LLAMA_API uint64_t llama_model_n_params(const struct llama_model * model);

    // Returns 0 on success
    LLAMA_API int llama_model_quantize(