musaMemcpy3DPeerAsync is not available · makllama/llama.cpp@53ccc4f · GitHub
[go: up one dir, main page]

Skip to content

Commit 53ccc4f

Browse files
committed
musaMemcpy3DPeerAsync is not available
Signed-off-by: Xiaodong Ye <xiaodong.ye@mthreads.com>
1 parent f57b501 commit 53ccc4f

File tree

1 file changed

+5
-0
lines changed

1 file changed

+5
-0
lines changed

ggml-cuda.cu

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1341,6 +1341,7 @@ static musaError_t ggml_cuda_Memcpy2DPeerAsync(
13411341
void * dst, int dstDevice, size_t dpitch, void * src, int srcDevice, size_t spitch, size_t width, size_t height, musaStream_t stream) {
13421342

13431343
#if !defined(GGML_USE_HIPBLAS)
1344+
/* XXX: musaMemcpy3DPeerAsync is not available in MUSA
13441345
// musaMemcpy2DAsync may fail with copies between vmm pools of different devices
13451346
musaMemcpy3DPeerParms p = {};
13461347
p.dstDevice = dstDevice;
@@ -1349,6 +1350,10 @@ static musaError_t ggml_cuda_Memcpy2DPeerAsync(
13491350
p.srcPtr = make_musaPitchedPtr(src, spitch, spitch, height);
13501351
p.extent = make_musaExtent(width, height, 1);
13511352
return musaMemcpy3DPeerAsync(&p, stream);
1353+
*/
1354+
GGML_UNUSED(dstDevice);
1355+
GGML_UNUSED(srcDevice);
1356+
return musaMemcpy2DAsync(dst, dpitch, src, spitch, width, height, musaMemcpyDeviceToDevice, stream);
13521357
#else
13531358
// HIP does not support musaMemcpy3DPeerAsync or vmm pools
13541359
GGML_UNUSED(dstDevice);

0 commit comments

Comments
 (0)
0