mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-30 21:34:36 +00:00
Update ggml-cuda.cu
Co-authored-by: slaren <slarengh@gmail.com>
This commit is contained in:
parent
3c8d6b160b
commit
30338c5643
@@ -8419,8 +8419,8 @@ static void ggml_cuda_mul_mat_mat_batched_cublas(const ggml_tensor * src0, const
|
|||||||
cu_compute_type = CUBLAS_COMPUTE_32F;
|
cu_compute_type = CUBLAS_COMPUTE_32F;
|
||||||
cu_data_type = CUDA_R_32F;
|
cu_data_type = CUDA_R_32F;
|
||||||
|
|
||||||
alpha = (const char *) &alpha_f32;
|
alpha = &alpha_f32;
|
||||||
beta = (const char *) &beta_f32;
|
beta = &beta_f32;
|
||||||
}
|
}
|
||||||
|
|
||||||
GGML_ASSERT(ne12 % ne02 == 0);
|
GGML_ASSERT(ne12 % ne02 == 0);
|
||||||
|
Loading…
Reference in New Issue
Block a user