Only one CUDA stream per device for async compute (#1898)
This commit is contained in:
parent
051e1b0e6a
commit
2c9380dd2f
3 changed files with 20 additions and 38 deletions
|
@@ -106,9 +106,6 @@ bool gpt_params_parse(int argc, char ** argv, gpt_params & params) {
|
|||
}
|
||||
|
||||
if (arg == "-s" || arg == "--seed") {
|
||||
#if defined(GGML_USE_CUBLAS)
|
||||
fprintf(stderr, "WARNING: when using cuBLAS generation results are NOT guaranteed to be reproducible.\n");
|
||||
#endif
|
||||
if (++i >= argc) {
|
||||
invalid_param = true;
|
||||
break;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue