Merge branch 'master' into compilade/pyright-tests

2024-07-07 10:51:30 -04:00 · 2024-07-07 10:51:30 -04:00 · 0caf60a79e
commit 0caf60a79e
parent 872aecbf30 f1948f1e10
31 changed files with 9399 additions and 73 deletions
--- a/examples/finetune/README.md
+++ b/examples/finetune/README.md
@@ -87,4 +87,4 @@ The LORA rank can be configured for each model tensor type separately with these

 The LORA rank of 'norm' tensors should always be 1.

-To see all available options use `finetune --help`.
+To see all available options use `llama-finetune --help`.
--- a/examples/finetune/finetune.sh
+++ b/examples/finetune/finetune.sh
@@ -8,7 +8,7 @@ if [[ ! $LLAMA_MODEL_DIR ]]; then LLAMA_MODEL_DIR="./models"; fi
 if [[ ! $LLAMA_TRAINING_DIR ]]; then LLAMA_TRAINING_DIR="."; fi

 # MODEL="$LLAMA_MODEL_DIR/openllama-3b-v2-q8_0.gguf" # This is the model the readme uses.
-MODEL="$LLAMA_MODEL_DIR/openllama-3b-v2.gguf" # An f16 model. Note in this case with "-g", you get an f32-format .BIN file that isn't yet supported if you use it with "main --lora" with GPU inferencing.
+MODEL="$LLAMA_MODEL_DIR/openllama-3b-v2.gguf" # An f16 model. Note in this case with "-g", you get an f32-format .BIN file that isn't yet supported if you use it with "llama-cli --lora" with GPU inferencing.

 while getopts "dg" opt; do
  case $opt in