From 6a6cfd6c6f34747142f155192df42e11cebec026 Mon Sep 17 00:00:00 2001 From: vithulep Date: Tue, 3 Sep 2024 12:17:44 +0530 Subject: [PATCH] Implemented vector length agnostic SVE using switch case for 512-bit, 256-bit, 128-bit vector lengths --- ggml/src/ggml-quants.c | 2 -- 1 file changed, 2 deletions(-) diff --git a/ggml/src/ggml-quants.c b/ggml/src/ggml-quants.c index 8b8440cbc..5ebdf96d1 100644 --- a/ggml/src/ggml-quants.c +++ b/ggml/src/ggml-quants.c @@ -3821,7 +3821,6 @@ void ggml_vec_dot_q4_0_q8_0(int n, float * restrict s, size_t bs, const void * r svfloat32_t sumv0 = svdup_n_f32(0.0f); svfloat32_t sumv1 = svdup_n_f32(0.0f); - assert(nb % 2 == 0); // TODO: handle odd nb const int vector_length = ggml_sve_cnt_b*8; // VLA Implementation using switch case @@ -5402,7 +5401,6 @@ void ggml_vec_dot_q8_0_q8_0(int n, float * restrict s, size_t bs, const void * r svfloat32_t sumv0 = svdup_n_f32(0.0f); svfloat32_t sumv1 = svdup_n_f32(0.0f); - assert(nb % 2 == 0); // TODO: handle odd nb const int vector_length = ggml_sve_cnt_b*8; //VLA Implemenation for SVE