Spaces:

natasa365
/

whisper.cpp

Running

germanaizek committed on May 20, 2024

Commit

8325ed5

1 Parent(s): 9794ea7

ggml-opencl, llama: using reserve() if count already known (llama/7272)

Files changed (1) hide show

ggml-opencl.cpp CHANGED Viewed

@@ -1,4 +1,4 @@
-#include "ggml.h"
 #include "ggml-opencl.h"
 #include "ggml-backend-impl.h"
@@ -1835,7 +1835,10 @@ static void ggml_cl_mul_mat_q_f32(const ggml_tensor * src0, const ggml_tensor *
                     CL_CHECK(clEnqueueNDRangeKernel(queue, *to_fp32_cl, 1, &offset, &global, local > 0 ? &local : NULL, events.size(), !events.empty() ? events.data() : NULL, NULL));
                 }
-                for (int64_t i12 = i02 * r2, e12 = i12 + r2; i12 < e12; i12++) {
                     if (mul_mat_vec) { // specialized dequantize_mul_mat_vec kernel
                         // copy src1 to device
                         events.emplace_back();

+#include "ggml.h"
 #include "ggml-opencl.h"
 #include "ggml-backend-impl.h"
                     CL_CHECK(clEnqueueNDRangeKernel(queue, *to_fp32_cl, 1, &offset, &global, local > 0 ? &local : NULL, events.size(), !events.empty() ? events.data() : NULL, NULL));
                 }
+                int64_t i12 = i02 * r2;
+                int64_t e12 = i12 + r2;
+                events.reserve(e12 - i12);
+                for (; i12 < e12; i12++) {
                     if (mul_mat_vec) { // specialized dequantize_mul_mat_vec kernel
                         // copy src1 to device
                         events.emplace_back();