mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-25 02:44:36 +00:00
CUDA: fix peer access logic (#3231)
This commit is contained in:
parent
111163e246
commit
ee66942d7e
14
ggml-cuda.cu
14
ggml-cuda.cu
@@ -6286,12 +6286,14 @@ void ggml_cuda_set_peer_access(const int n_tokens) {
|
||||
continue;
|
||||
}
|
||||
|
||||
int canAccessPeer;
|
||||
CUDA_CHECK(cudaDeviceCanAccessPeer(&canAccessPeer, id, id_other));
|
||||
if (enable_peer_access) {
|
||||
CUDA_CHECK(cudaDeviceEnablePeerAccess(id_other, 0));
|
||||
} else {
|
||||
CUDA_CHECK(cudaDeviceDisablePeerAccess(id_other));
|
||||
int can_access_peer;
|
||||
CUDA_CHECK(cudaDeviceCanAccessPeer(&can_access_peer, id, id_other));
|
||||
if (can_access_peer) {
|
||||
if (enable_peer_access) {
|
||||
CUDA_CHECK(cudaDeviceEnablePeerAccess(id_other, 0));
|
||||
} else {
|
||||
CUDA_CHECK(cudaDeviceDisablePeerAccess(id_other));
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user