mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-29 04:44:34 +00:00
Update ggml-cuda.cu
Co-authored-by: slaren <slarengh@gmail.com>
This commit is contained in:
parent
3c8d6b160b
commit
30338c5643
@@ -8419,8 +8419,8 @@ static void ggml_cuda_mul_mat_mat_batched_cublas(const ggml_tensor * src0, const
 cu_compute_type = CUBLAS_COMPUTE_32F;
 cu_data_type = CUDA_R_32F;

-alpha = (const char *) &alpha_f32;
-beta = (const char *) &beta_f32;
+alpha = &alpha_f32;
+beta = &beta_f32;
 }

 GGML_ASSERT(ne12 % ne02 == 0);
Loading…
Reference in New Issue
Block a user