llama : support save/load state with FA enabled

ggml-ci
2024-04-25 18:18:13 +03:00 · 2024-04-25 18:18:13 +03:00 · 1fd5bc3d5e
commit 1fd5bc3d5e
parent cb3547ac46
2 changed files with 12 additions and 7 deletions
--- a/ci/run.sh
+++ b/ci/run.sh
@@ -517,7 +517,8 @@ function gg_run_open_llama_7b_v2 {

    (time ./bin/imatrix --model ${model_f16} -f ${wiki_test} -t 1 -ngl 999 -c 2048 -b 512 --chunks 4 ) 2>&1 | tee -a $OUT/${ci}-imatrix.log

-    (time ./bin/save-load-state --model ${model_q4_0} ) 2>&1 | tee -a $OUT/${ci}-save-load-state.log
+    (time ./bin/save-load-state     --model ${model_q4_0} ) 2>&1 | tee -a $OUT/${ci}-save-load-state.log
+    (time ./bin/save-load-state -fa --model ${model_q4_0} ) 2>&1 | tee -a $OUT/${ci}-save-load-state.log

    function check_ppl {
        qnt="$1"