Check for SYCL as well as cuBLAS when fully offloaded, for better performance

This commit is contained in:
jianyuzh 2024-01-23 13:34:05 +08:00
parent 67e6b3cb7d
commit 533c647d0e

View file

@@ -6703,7 +6703,7 @@ static int llama_decode_internal(
} }
const bool fully_offloaded = model.n_gpu_layers >= (int) hparams.n_layer + 1; const bool fully_offloaded = model.n_gpu_layers >= (int) hparams.n_layer + 1;
if (ggml_cpu_has_cublas() && fully_offloaded) { if ((ggml_cpu_has_cublas() || ggml_cpu_has_sycl()) && fully_offloaded) {
n_threads = 1; n_threads = 1;
} }