Fix cudaMemcpy direction (#4599)

author Henrik Forstén <redacted>

Fri, 22 Dec 2023 13:34:05 +0000 (15:34 +0200)

committer GitHub <redacted>

Fri, 22 Dec 2023 13:34:05 +0000 (14:34 +0100)
author Henrik Forstén <redacted>
Fri, 22 Dec 2023 13:34:05 +0000 (15:34 +0200)
committer GitHub <redacted>
Fri, 22 Dec 2023 13:34:05 +0000 (14:34 +0100)
diff --git a/ggml-cuda.cu b/ggml-cuda.cu

index 37d7f27925009ab6d4b83aca787d72e5dc987fea..da8fd1e09c7be35e3fdc390b4480dd634bbaea5f 100644 (file)
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -8843,7 +8843,7 @@ static void ggml_cuda_mul_mat_id(const ggml_tensor * src0, const ggml_tensor * s
          const cudaMemcpyKind src1_kind = src1->backend == GGML_BACKEND_CPU ?
              cudaMemcpyHostToDevice : cudaMemcpyDeviceToDevice;
          const cudaMemcpyKind dst_kind  =  dst->backend == GGML_BACKEND_CPU ?
-            cudaMemcpyHostToDevice : cudaMemcpyDeviceToDevice;
+            cudaMemcpyDeviceToHost : cudaMemcpyDeviceToDevice;
  
          for (int32_t row_id = 0; row_id < n_as; ++row_id) {
              const struct ggml_tensor * src0_row = dst->src[row_id + 2];
author	Henrik Forstén <redacted>
	Fri, 22 Dec 2023 13:34:05 +0000 (15:34 +0200)
committer	GitHub <redacted>
	Fri, 22 Dec 2023 13:34:05 +0000 (14:34 +0100)