Update CUDA graph on scale change plus clear nodes/params (#9550)
* Avoid using the saved CUDA graph if the scale changes, and reset nodes/params on update. Fixes https://github.com/ggerganov/llama.cpp/issues/9451
* Clear before resize
This commit is contained in:
parent
e948a7da7a
commit
41f477879f
2 changed files with 10 additions and 0 deletions
|
@ -569,6 +569,7 @@ struct ggml_graph_node_properties {
|
|||
int64_t ne[GGML_MAX_DIMS];
|
||||
size_t nb[GGML_MAX_DIMS];
|
||||
void * src_address[GGML_MAX_SRC];
|
||||
int32_t op_params[GGML_MAX_OP_PARAMS / sizeof(int32_t)];
|
||||
};
|
||||
|
||||
struct ggml_cuda_graph {
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue