rpc : early register backend devices (#11262)

Register RPC devices early and do not propagate RPC specifics into the
llama model structures.

ref: #10609
This commit is contained in:
Radoslav Gerganov 2025-01-17 10:57:09 +02:00 committed by GitHub
parent a133566d34
commit 667d72846c
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
10 changed files with 61 additions and 55 deletions

View file

@@ -323,8 +323,6 @@ struct llama_model {
// gguf metadata
std::unordered_map<std::string, std::string> gguf_kv;
std::vector<std::string> rpc_servers;
// list of devices used in this model
std::vector<ggml_backend_dev_t> devices;