add tests.sh

2024-04-13 16:01:34 +02:00 · 2024-04-13 16:01:34 +02:00 · 6738215a10
commit 6738215a10
parent 1d86bd87fb
1 changed files with 81 additions and 0 deletions
--- a/examples/gguf-split/tests.sh
+++ b/examples/gguf-split/tests.sh
@ -0,0 +1,81 @@
 #!/bin/bash
 # Test script for gguf-split.
 # Arguments:
 #   $1 - directory holding the built gguf-split and main binaries (required)
 #   $2 - temp folder used as the working directory (optional, defaults to /tmp)
 set -eu
 # The binary directory is mandatory: print the usage text and stop without it.
 if [ $# -eq 0 ]; then
   printf '%s\n' "usage:   $0 path_to_build_binary [path_to_temp_folder]"
   printf '%s\n' "example: $0 ../../build/bin ../../tmp"
   exit 1
 fi
 # Take the second argument whenever one was passed (even an empty one); fall back to /tmp otherwise.
 TMP_DIR=${2-/tmp}
 # Trace every command from here on.
 set -x
 SPLIT="$1/gguf-split"
 MAIN="$1/main"
 WORK_PATH="$TMP_DIR"
 # Remember the directory the script was started from.
 CUR_DIR="$(pwd)"
 # 1. Get a model
 # Runs in a subshell so the directory change does not leak into the rest of the script.
 (
   # Quoted so a work path containing spaces or glob characters is entered as-is.
   cd "$WORK_PATH"
   # hf.sh is located relative to the directory the script was started from
   # and invoked from inside the work path — presumably it saves the file there; confirm against hf.sh.
   "$CUR_DIR"/../../scripts/hf.sh --repo ggml-org/gemma-1.1-2b-it-Q8_0-GGUF --file gemma-1.1-2b-it.Q8_0.gguf
 )
 echo PASS
 # 2. Split with max tensors strategy
 # Every path expansion is quoted so a binary directory or work path containing spaces still works.
 "$SPLIT" --split-max-tensors 28 "$WORK_PATH/gemma-1.1-2b-it.Q8_0.gguf" "$WORK_PATH/ggml-model-split"
 echo PASS
 echo
 # 2b. Test the sharded model is loading properly
 # The shard name hard-codes a 6-way split — assumes step 2 yields exactly 6 shards; TODO confirm if the model or tensor limit changes.
 "$MAIN" --model "$WORK_PATH/ggml-model-split-00001-of-00006.gguf" --random-prompt --n-predict 32
 echo PASS
 echo
 # 3. Merge
 # Only the first shard is passed as input; the merged model is written next to it in the work path.
 "$SPLIT" --merge "$WORK_PATH/ggml-model-split-00001-of-00006.gguf" "$WORK_PATH/ggml-model-merge.gguf"
 echo PASS
 echo
 # 3b. Test the merged model is loading properly
 "$MAIN" --model "$WORK_PATH/ggml-model-merge.gguf" --random-prompt --n-predict 32
 echo PASS
 echo
 # NOTE(review): steps 4 through 5b below are commented out, so they never run.
 # Presumably they are waiting on --no-tensor-in-metadata support — confirm before re-enabling.
 # 4. Split with no tensor in metadata
 #$SPLIT --split-max-tensors 32 --no-tensor-in-metadata $WORK_PATH/ggml-model-merge.gguf $WORK_PATH/ggml-model-split-32-tensors
 #echo PASS
 #echo
 # 4b. Test the sharded model is loading properly
 #$MAIN --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00006.gguf --random-prompt --n-predict 32
 #echo PASS
 #echo
 # 5. Merge
 #$SPLIT --merge $WORK_PATH/ggml-model-split-32-tensors-00001-of-00006.gguf $WORK_PATH/ggml-model-merge-2.gguf
 #echo PASS
 #echo
 # 5b. Test the merged model is loading properly
 #$MAIN --model $WORK_PATH/ggml-model-merge-2.gguf --random-prompt --n-predict 32
 #echo PASS
 #echo
 # 6. Split with size strategy
 # Re-splits the merged model with a 2G size cap per shard.
 # Path expansions are quoted so a binary directory or work path containing spaces still works.
 "$SPLIT" --split-max-size 2G "$WORK_PATH/ggml-model-merge.gguf" "$WORK_PATH/ggml-model-split-2G"
 echo PASS
 echo
 # 6b. Test the sharded model is loading properly
 # The shard name hard-codes a 2-way split — assumes the 2G cap yields exactly 2 shards for this model; TODO confirm.
 "$MAIN" --model "$WORK_PATH/ggml-model-split-2G-00001-of-00002.gguf" --random-prompt --n-predict 32
 echo PASS
 echo