Spaces:
Sleeping
Sleeping
ci : fix wikitext url + compile warnings (llama/5569)
Browse files - ggml-quants.c +3 -3
ggml-quants.c
CHANGED
|
@@ -1837,9 +1837,9 @@ static void quantize_row_q2_K_impl(const float * restrict x, block_q2_K * restri
|
|
| 1837 |
float sigma2 = sumx2/QK_K;
|
| 1838 |
for (int j = 0; j < QK_K/16; ++j) {
|
| 1839 |
const float * restrict qw = quant_weights + QK_K * i + 16*j;
|
| 1840 |
-
for (int l = 0; l < 16; ++l) weight[l] = qw[l] * sqrtf(sigma2 + x[16*j + l]*x[16*j + l]);
|
| 1841 |
-
for (int l = 0; l < 16; ++l) sw[j] += weight[l];
|
| 1842 |
-
scales[j] = make_qkx3_quants(16, 3, x + 16*j, weight, L + 16*j, &mins[j], Laux, -0.9f, 0.05f, 36, false);
|
| 1843 |
}
|
| 1844 |
|
| 1845 |
float dm = make_qp_quants(QK_K/16, 15, scales, Ls, sw);
|
|
|
|
| 1837 |
float sigma2 = sumx2/QK_K;
|
| 1838 |
for (int j = 0; j < QK_K/16; ++j) {
|
| 1839 |
const float * restrict qw = quant_weights + QK_K * i + 16*j;
|
| 1840 |
+
for (int l = 0; l < QK_K/16; ++l) weight[l] = qw[l] * sqrtf(sigma2 + x[16*j + l]*x[16*j + l]);
|
| 1841 |
+
for (int l = 0; l < QK_K/16; ++l) sw[j] += weight[l];
|
| 1842 |
+
scales[j] = make_qkx3_quants(QK_K/16, 3, x + 16*j, weight, L + 16*j, &mins[j], Laux, -0.9f, 0.05f, 36, false);
|
| 1843 |
}
|
| 1844 |
|
| 1845 |
float dm = make_qp_quants(QK_K/16, 15, scales, Ls, sw);
|