fix ci errors
This commit is contained in:
parent
e44cef8144
commit
33c2a25e3f
3 changed files with 5 additions and 5 deletions
|
@ -20,4 +20,4 @@ server-parallel.exe -m models\7B\ggml-model.gguf --ctx_size 2048 -t 4 -ngl 33 --
|
||||||
The above command will start a server that by default listens on `127.0.0.1:8080`.
|
The above command will start a server that by default listens on `127.0.0.1:8080`.
|
||||||
You can consume the endpoints with Postman or from Node.js using the axios library. You can visit the web front end at the same URL.
|
You can consume the endpoints with Postman or from Node.js using the axios library. You can visit the web front end at the same URL.
|
||||||
|
|
||||||
# This example is a Proof of Concept; it has bugs and unexpected behaviors
|
# This example is a Proof of Concept; it has bugs and unexpected behaviors
|
||||||
|
|
|
@ -152,4 +152,4 @@ const auto index_html = R"(
|
||||||
</script>
|
</script>
|
||||||
</body>
|
</body>
|
||||||
</html>
|
</html>
|
||||||
)";
|
)";
|
||||||
|
|
|
@ -249,7 +249,7 @@ struct server_parallel_context {
|
||||||
request_clean_kv = false;
|
request_clean_kv = false;
|
||||||
LOG_TEE("%s: clearing the KV cache\n", __func__);
|
LOG_TEE("%s: clearing the KV cache\n", __func__);
|
||||||
}
|
}
|
||||||
|
|
||||||
// assign workload to the slots
|
// assign workload to the slots
|
||||||
if (params.cont_batching || batch.n_tokens == 0) {
|
if (params.cont_batching || batch.n_tokens == 0) {
|
||||||
for (llama_client_slot & slot : slots) {
|
for (llama_client_slot & slot : slots) {
|
||||||
|
@ -287,7 +287,7 @@ struct server_parallel_context {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if (batch.n_tokens == 0) {
|
if (batch.n_tokens == 0) {
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
@ -806,4 +806,4 @@ int main(int argc, char **argv)
|
||||||
{
|
{
|
||||||
return 1;
|
return 1;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue