mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-05 00:04:36 +00:00
Fix tests
This commit is contained in:
parent
592b3b26bb
commit
5574533a72
@ -9651,7 +9651,7 @@ static int iq2_find_best_neighbour(const uint16_t * restrict neighbours, const u
|
|||||||
|
|
||||||
static void quantize_row_iq2_xxs_impl(const float * restrict x, void * restrict vy, int n, const float * restrict quant_weights) {
|
static void quantize_row_iq2_xxs_impl(const float * restrict x, void * restrict vy, int n, const float * restrict quant_weights) {
|
||||||
|
|
||||||
const int gindex = iq2_data_index(256);
|
const int gindex = iq2_data_index(GGML_TYPE_IQ2_XXS);
|
||||||
|
|
||||||
const uint64_t * kgrid_q2xs = iq2_data[gindex].grid;
|
const uint64_t * kgrid_q2xs = iq2_data[gindex].grid;
|
||||||
const int * kmap_q2xs = iq2_data[gindex].map;
|
const int * kmap_q2xs = iq2_data[gindex].map;
|
||||||
@ -9824,7 +9824,7 @@ static void quantize_row_iq2_xxs_impl(const float * restrict x, void * restrict
|
|||||||
|
|
||||||
static void quantize_row_iq2_xs_impl(const float * restrict x, void * restrict vy, int n, const float * restrict quant_weights) {
|
static void quantize_row_iq2_xs_impl(const float * restrict x, void * restrict vy, int n, const float * restrict quant_weights) {
|
||||||
|
|
||||||
const int gindex = iq2_data_index(512);
|
const int gindex = iq2_data_index(GGML_TYPE_IQ2_XS);
|
||||||
|
|
||||||
const uint64_t * kgrid_q2xs = iq2_data[gindex].grid;
|
const uint64_t * kgrid_q2xs = iq2_data[gindex].grid;
|
||||||
const int * kmap_q2xs = iq2_data[gindex].map;
|
const int * kmap_q2xs = iq2_data[gindex].map;
|
||||||
|
3
ggml.c
3
ggml.c
@ -19209,7 +19209,8 @@ size_t ggml_quantize_q8_0(const float * src, void * dst, int n, int k, int64_t *
|
|||||||
bool ggml_quantize_requires_imatrix(enum ggml_type type) {
|
bool ggml_quantize_requires_imatrix(enum ggml_type type) {
|
||||||
return
|
return
|
||||||
type == GGML_TYPE_IQ2_XXS ||
|
type == GGML_TYPE_IQ2_XXS ||
|
||||||
type == GGML_TYPE_IQ2_XS;
|
type == GGML_TYPE_IQ2_XS ||
|
||||||
|
type == GGML_TYPE_IQ1_S;
|
||||||
}
|
}
|
||||||
|
|
||||||
size_t ggml_quantize_chunk(enum ggml_type type, const float * src, void * dst, int start,
|
size_t ggml_quantize_chunk(enum ggml_type type, const float * src, void * dst, int start,
|
||||||
|
Loading…
Reference in New Issue
Block a user