Use memcpy for copying contiguous tensors · ggml-org/llama.cpp@1f6cc01 · GitHub
[go: up one dir, main page]

Skip to content

Commit 1f6cc01

Browse files
committed
Use memcpy for copying contiguous tensors
ggml-ci
1 parent ea0c39b commit 1f6cc01

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

ggml/src/ggml-sycl/cpy.cpp

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -758,8 +758,9 @@ void ggml_sycl_cpy(ggml_backend_sycl_context & ctx, const ggml_tensor * src0, co
758 758       char * src1_ddc = (char *) src1->data;
759 759       GGML_SYCL_DEBUG("[SYCL] %s: Tensor supplied: %s to %s\n", __func__, ggml_type_name(src0->type),
760 760                       ggml_type_name(src1->type));
761     -
762     -     if (src0->type == GGML_TYPE_F32 && src1->type == GGML_TYPE_F32) {
    761 +     if ((src0->type == src1->type) && (ggml_is_contiguous(src0) && ggml_is_contiguous(src1))) {
    762 +         main_stream->memcpy(src1_ddc, src0_ddc, ggml_nbytes(src0));
    763 +     } else if (src0->type == GGML_TYPE_F32 && src1->type == GGML_TYPE_F32) {
763 764           ggml_cpy_f32_f32_sycl(src0_ddc, src1_ddc, ne, ne00, ne01, ne02, nb00, nb01, nb02, nb03, ne10, ne11, ne12, nb10,
764 765                                 nb11, nb12, nb13, main_stream);
765 766       } else if (src0->type == GGML_TYPE_F32 && src1->type == GGML_TYPE_F16) {

0 commit comments

Comments
 (0)
0