mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-12 19:50:17 +00:00
fix code
This commit is contained in:
parent
97d22be58c
commit
344467f2b8
@ -1417,7 +1417,7 @@ class BitnetModel(Model):
|
||||
def weight_quant(self, weight):
|
||||
dtype = weight.dtype
|
||||
weight = weight.float()
|
||||
s = 1 / weight.abs().mean().clamp(min=1e-5)
|
||||
s = 1 / weight.abs().mean().clamp(min=1e-5)
|
||||
result = (weight * s).round().clamp(-1, 1) / s
|
||||
return result.type(dtype)
|
||||
|
||||
|
@ -3802,6 +3802,10 @@ void ggml_vec_dot_i2_i8_s(int n, float * restrict s, size_t bs, const void * res
|
||||
UNUSED(by);
|
||||
UNUSED(nrc);
|
||||
|
||||
#if defined(__AVX2__)
|
||||
// TODO
|
||||
#else
|
||||
|
||||
int sumi = 0;
|
||||
|
||||
for (int i = 0; i < n / 4; i++) {
|
||||
@ -3812,7 +3816,7 @@ void ggml_vec_dot_i2_i8_s(int n, float * restrict s, size_t bs, const void * res
|
||||
sumi += (int)y[i*4+3] * weight[3];
|
||||
}
|
||||
*s = (float)sumi;
|
||||
|
||||
#endif
|
||||
}
|
||||
|
||||
void ggml_vec_dot_q4_0_q8_0(int n, float * restrict s, size_t bs, const void * restrict vx, size_t bx, const void * restrict vy, size_t by, int nrc) {
|
||||
|
Loading…
Reference in New Issue
Block a user