gguf-py : add IQ1_M to GGML_QUANT_SIZES (#6761)

This commit is contained in:
pmysl 2024-04-21 14:49:30 +02:00 committed by GitHub
parent e8d35f47cb
commit c1386c936e
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -872,6 +872,7 @@ GGML_QUANT_SIZES = {
GGMLQuantizationType.I32: (1, 4),
GGMLQuantizationType.I64: (1, 8),
GGMLQuantizationType.F64: (1, 8),
GGMLQuantizationType.IQ1_M: (256, QK_K // 8 + QK_K // 16 + QK_K // 32),
}