Spaces:
Running
Running
Abhilash Majumder
committed on
remove row=1 cond (llama/6532)
Browse files
- ggml-sycl.cpp +1 -2
ggml-sycl.cpp
CHANGED
|
@@ -15776,7 +15776,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
|
|
| 15776 |
#ifdef GGML_SYCL_FORCE_DMMV
|
| 15777 |
const bool use_mul_mat_vec_q = false;
|
| 15778 |
#else
|
| 15779 |
-
bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type)
|
| 15780 |
use_mul_mat_vec_q = use_mul_mat_vec_q ||
|
| 15781 |
(src0->type == GGML_TYPE_IQ2_XXS) || (src0->type == GGML_TYPE_IQ2_XS) || (src0->type == GGML_TYPE_IQ2_S) ||
|
| 15782 |
(src0->type == GGML_TYPE_IQ3_XXS) || (src0->type == GGML_TYPE_IQ3_S) ||
|
|
@@ -15787,7 +15787,6 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
|
|
| 15787 |
#endif // GGML_SYCL_FORCE_DMMV
|
| 15788 |
|
| 15789 |
if (use_mul_mat_vec_q) {
|
| 15790 |
-
// NOTE: this kernel does not support ggml_nrows(src1) > 1
|
| 15791 |
// GGML_SYCL_DEBUG("ggml_sycl_mul_mat ggml_sycl_op_mul_mat_vec_q path\n");
|
| 15792 |
ggml_sycl_op_mul_mat(src0, src1, dst, ggml_sycl_op_mul_mat_vec_q, true);
|
| 15793 |
} else {
|
|
|
|
| 15776 |
#ifdef GGML_SYCL_FORCE_DMMV
|
| 15777 |
const bool use_mul_mat_vec_q = false;
|
| 15778 |
#else
|
| 15779 |
+
bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
|
| 15780 |
use_mul_mat_vec_q = use_mul_mat_vec_q ||
|
| 15781 |
(src0->type == GGML_TYPE_IQ2_XXS) || (src0->type == GGML_TYPE_IQ2_XS) || (src0->type == GGML_TYPE_IQ2_S) ||
|
| 15782 |
(src0->type == GGML_TYPE_IQ3_XXS) || (src0->type == GGML_TYPE_IQ3_S) ||
|
|
|
|
| 15787 |
#endif // GGML_SYCL_FORCE_DMMV
|
| 15788 |
|
| 15789 |
if (use_mul_mat_vec_q) {
|
|
|
|
| 15790 |
// GGML_SYCL_DEBUG("ggml_sycl_mul_mat ggml_sycl_op_mul_mat_vec_q path\n");
|
| 15791 |
ggml_sycl_op_mul_mat(src0, src1, dst, ggml_sycl_op_mul_mat_vec_q, true);
|
| 15792 |
} else {
|