CUDA: fixed peer access toggle synchronization
This commit is contained in:
parent
b9f47952ff
commit
e692c2d887
1 changed file with 4 additions and 0 deletions
|
@@ -8,6 +8,7 @@
|
|||
#include <limits>
|
||||
#include <stdint.h>
|
||||
#include <stdio.h>
|
||||
#include <unistd.h>
|
||||
#include <vector>
|
||||
|
||||
|
||||
|
@@ -7999,6 +8000,9 @@ static void ggml_cuda_set_peer_access(const int n_tokens) {
|
|||
}
|
||||
}
|
||||
}
|
||||
|
||||
usleep(100000); // 0.1 s
|
||||
|
||||
#endif // NDEBUG
|
||||
|
||||
peer_access_enabled = enable_peer_access;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue