Mirror of https://github.com/ggerganov/llama.cpp.git (synced 2025-01-12 11:40:17 +00:00)
ggml : disable tests involving i-matrix quantization
This commit is contained in:
Parent: b0597b1493
Commit: 8cc7145cc7
@ -2968,12 +2968,8 @@ static void ggml_compute_forward_dup_f16(
|
|||||||
id += ne00 * (ne01 - ir1);
|
id += ne00 * (ne01 - ir1);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} else if (ggml_get_type_traits_cpu(dst->type)->from_float || ggml_get_type_traits(dst->type)->from_float_ref) {
|
} else if (ggml_get_type_traits_cpu(dst->type)->from_float) {
|
||||||
ggml_from_float_t quantize_row_q = ggml_get_type_traits_cpu(dst->type)->from_float;
|
ggml_from_float_t const quantize_row_q = ggml_get_type_traits_cpu(dst->type)->from_float;
|
||||||
if (!quantize_row_q) {
|
|
||||||
quantize_row_q = ggml_get_type_traits(dst->type)->from_float_ref;
|
|
||||||
}
|
|
||||||
|
|
||||||
float * src0_f32 = (float *) params->wdata + (ne00 + CACHE_LINE_SIZE_F32) * ith;
|
float * src0_f32 = (float *) params->wdata + (ne00 + CACHE_LINE_SIZE_F32) * ith;
|
||||||
|
|
||||||
size_t id = 0;
|
size_t id = 0;
|
||||||
@ -3569,11 +3565,8 @@ static void ggml_compute_forward_dup_f32(
|
|||||||
id += rs * (ne01 - ir1);
|
id += rs * (ne01 - ir1);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} else if (ggml_get_type_traits_cpu(dst->type)->from_float || ggml_get_type_traits(dst->type)->from_float_ref) {
|
} else if (ggml_get_type_traits_cpu(dst->type)->from_float) {
|
||||||
ggml_from_float_t quantize_row_q = ggml_get_type_traits_cpu(dst->type)->from_float;
|
ggml_from_float_t const quantize_row_q = ggml_get_type_traits_cpu(dst->type)->from_float;
|
||||||
if (!quantize_row_q) {
|
|
||||||
quantize_row_q = ggml_get_type_traits(dst->type)->from_float_ref;
|
|
||||||
}
|
|
||||||
|
|
||||||
size_t id = 0;
|
size_t id = 0;
|
||||||
size_t rs = nb0 * (ne00 / ggml_blck_size(dst->type));
|
size_t rs = nb0 * (ne00 / ggml_blck_size(dst->type));
|
||||||
|
@ -3549,9 +3549,9 @@ static std::vector<std::unique_ptr<test_case>> make_test_cases_eval() {
|
|||||||
|
|
||||||
for (ggml_type type_src : {GGML_TYPE_F16, GGML_TYPE_F32}) {
|
for (ggml_type type_src : {GGML_TYPE_F16, GGML_TYPE_F32}) {
|
||||||
for (ggml_type type_dst : all_types) {
|
for (ggml_type type_dst : all_types) {
|
||||||
//if (type_dst == GGML_TYPE_IQ2_S || type_dst == GGML_TYPE_IQ3_XXS || type_dst == GGML_TYPE_IQ3_S) {
|
if (type_dst == GGML_TYPE_IQ2_S || type_dst == GGML_TYPE_IQ3_XXS || type_dst == GGML_TYPE_IQ3_S) {
|
||||||
// continue;
|
continue;
|
||||||
//}
|
}
|
||||||
test_cases.emplace_back(new test_cpy(type_src, type_dst, {256, 4, 4, 4}));
|
test_cases.emplace_back(new test_cpy(type_src, type_dst, {256, 4, 4, 4}));
|
||||||
test_cases.emplace_back(new test_cpy(type_src, type_dst, {256, 2, 3, 4}, {0, 2, 1, 3})); // cpy by rows
|
test_cases.emplace_back(new test_cpy(type_src, type_dst, {256, 2, 3, 4}, {0, 2, 1, 3})); // cpy by rows
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user