CUDA: fix partial offloading for ne0 % 256 != 0 (#8572)
This commit is contained in:
parent
705b7ecf60
commit
a15ef8f8a0
4 changed files with 29 additions and 15 deletions
|
@@ -134,6 +134,10 @@ void ggml_backend_buffer_set_usage(ggml_backend_buffer_t buffer, enum ggml_backe
|
|||
}
|
||||
}
|
||||
|
||||
// Reads back the `usage` field stored on `buffer` and returns it unchanged.
// `buffer` is dereferenced without a NULL check.
enum ggml_backend_buffer_usage ggml_backend_buffer_get_usage(ggml_backend_buffer_t buffer) {
    const enum ggml_backend_buffer_usage current_usage = buffer->usage;
    return current_usage;
}
|
||||
|
||||
// Returns the buffer type handle held in the `buft` field of `buffer`.
// `buffer` is dereferenced without a NULL check.
ggml_backend_buffer_type_t ggml_backend_buffer_get_type(ggml_backend_buffer_t buffer) {
    ggml_backend_buffer_type_t type_handle = buffer->buft;
    return type_handle;
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue