Skip to content

Commit 25fda88

Browse files
Ttlhodlen
authored and committed
Fix CudaMemcpy direction (ggml-org#4599)
1 parent 6e2e24c commit 25fda88

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml-cuda.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -8843,7 +8843,7 @@ static void ggml_cuda_mul_mat_id(const ggml_tensor * src0, const ggml_tensor * s
8843 8843
const cudaMemcpyKind src1_kind = src1->backend == GGML_BACKEND_CPU ?
8844 8844
cudaMemcpyHostToDevice : cudaMemcpyDeviceToDevice;
8845 8845
const cudaMemcpyKind dst_kind = dst->backend == GGML_BACKEND_CPU ?
8846-
cudaMemcpyHostToDevice : cudaMemcpyDeviceToDevice;
8846+
cudaMemcpyDeviceToHost : cudaMemcpyDeviceToDevice;
8847 8847

8848 8848
for (int32_t row_id = 0; row_id < n_as; ++row_id) {
8849 8849
const struct ggml_tensor * src0_row = dst->src[row_id + 2];

0 commit comments

Comments
 (0)