Abhilash Majumder committed on
Commit
8499e3f
·
unverified ·
1 Parent(s): 873102e

Remove the `ggml_nrows(src1) == 1` condition from the `use_mul_mat_vec_q` check (llama/6532)

Browse files
Files changed (1) hide show
  1. ggml-sycl.cpp +1 -2
ggml-sycl.cpp CHANGED
@@ -15776,7 +15776,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
15776
  #ifdef GGML_SYCL_FORCE_DMMV
15777
  const bool use_mul_mat_vec_q = false;
15778
  #else
15779
- bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type) && ggml_nrows(src1) == 1;
15780
  use_mul_mat_vec_q = use_mul_mat_vec_q ||
15781
  (src0->type == GGML_TYPE_IQ2_XXS) || (src0->type == GGML_TYPE_IQ2_XS) || (src0->type == GGML_TYPE_IQ2_S) ||
15782
  (src0->type == GGML_TYPE_IQ3_XXS) || (src0->type == GGML_TYPE_IQ3_S) ||
@@ -15787,7 +15787,6 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
15787
  #endif // GGML_SYCL_FORCE_DMMV
15788
 
15789
  if (use_mul_mat_vec_q) {
15790
- // NOTE: this kernel does not support ggml_nrows(src1) > 1
15791
  // GGML_SYCL_DEBUG("ggml_sycl_mul_mat ggml_sycl_op_mul_mat_vec_q path\n");
15792
  ggml_sycl_op_mul_mat(src0, src1, dst, ggml_sycl_op_mul_mat_vec_q, true);
15793
  } else {
 
15776
  #ifdef GGML_SYCL_FORCE_DMMV
15777
  const bool use_mul_mat_vec_q = false;
15778
  #else
15779
+ bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
15780
  use_mul_mat_vec_q = use_mul_mat_vec_q ||
15781
  (src0->type == GGML_TYPE_IQ2_XXS) || (src0->type == GGML_TYPE_IQ2_XS) || (src0->type == GGML_TYPE_IQ2_S) ||
15782
  (src0->type == GGML_TYPE_IQ3_XXS) || (src0->type == GGML_TYPE_IQ3_S) ||
 
15787
  #endif // GGML_SYCL_FORCE_DMMV
15788
 
15789
  if (use_mul_mat_vec_q) {
 
15790
  // GGML_SYCL_DEBUG("ggml_sycl_mul_mat ggml_sycl_op_mul_mat_vec_q path\n");
15791
  ggml_sycl_op_mul_mat(src0, src1, dst, ggml_sycl_op_mul_mat_vec_q, true);
15792
  } else {