CUDA: add BF16 support (#11093)

* CUDA: add BF16 support
This commit is contained in:
Johannes Gäßler 2025-01-06 02:33:52 +01:00 committed by GitHub
parent b56f079e28
commit 46e3556e01
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
6 changed files with 87 additions and 39 deletions

View file

@@ -680,6 +680,8 @@ to_fp32_cuda_t ggml_get_to_fp32_cuda(ggml_type type) {
return dequantize_row_iq3_s_cuda;
case GGML_TYPE_F16:
return convert_unary_cuda<half>;
case GGML_TYPE_BF16:
return convert_unary_cuda<nv_bfloat16>;
default:
return nullptr;
}