diff --git a/examples/xgenmm/quantize.sh b/examples/xgenmm/quantize.sh
new file mode 100644
index 000000000..afc9b9041
--- /dev/null
+++ b/examples/xgenmm/quantize.sh
@@ -0,0 +1,10 @@
+gguf_dir=/export/share/yutong/xgenmm/llamacpp_wd/siglip_kosmos_phi3_4k_instruct_bf16_patch128/gguf
+model_name=phi3_mini_4k_instruct_f16
+quantize_method=Q4_K_M
+
+outname=${model_name}_${quantize_method}
+input_model_path=$gguf_dir/$model_name.gguf
+output_model_path=$gguf_dir/$outname.gguf
+echo $outname
+cd ../../
+./llama-quantize $input_model_path $output_model_path $quantize_method
\ No newline at end of file
diff --git a/examples/xgenmm/run_cli.sh b/examples/xgenmm/run_cli.sh
index 5da2bd376..df10fa319 100644
--- a/examples/xgenmm/run_cli.sh
+++ b/examples/xgenmm/run_cli.sh
@@ -35,14 +35,14 @@ make xgenmm-cli
 # --seed 42 --ctx-size 4096 --predict 1024 \
 # --temp 0 --verbose-prompt
 
-# Q="What is the address of this resturant?"
+Q="What is the address of this resturant?"
 # Q="Is this dine in or dine out receipt?"
 # Q="What is the total amount paid?"
 # Q="What is card holder's name?"
 # Q="What is the transaction date?"
 # Q="What is the phone number of this resturant?"
 # Q="Who is the attendant?"
-Q="Who is the cashier?"
+# Q="Who is the cashier?"
 # Q="Briefly describe this image."
 prompt="<|system|>\nA chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user's questions.<|end|>\n<|user|>\n\n $Q<|end|>\n<|assistant|>\n"
 echo $prompt
diff --git a/test_anyres_handle_patches b/test_anyres_handle_patches
new file mode 100755
index 000000000..d7807c196
Binary files /dev/null and b/test_anyres_handle_patches differ
diff --git a/xgenmm-cli b/xgenmm-cli
index ef1407df1..f17b35a8e 100755
Binary files a/xgenmm-cli and b/xgenmm-cli differ