Browse Source

ggml : fix OpenCL broadcast requirement for ggml_mul (close #4453)

Georgi Gerganov 2 years ago
parent
commit
55e87c3749
1 changed file with 2 additions and 2 deletions
  1. 2 2
      ggml.c

+ 2 - 2
ggml.c

@@ -7759,10 +7759,10 @@ static void ggml_compute_forward_mul_f32(
     const int ith = params->ith;
     const int ith = params->ith;
     const int nth = params->nth;
     const int nth = params->nth;
 
 
-// TODO: OpenCL kernel support broadcast
 #ifdef GGML_USE_CLBLAST
 #ifdef GGML_USE_CLBLAST
     if (src1->backend == GGML_BACKEND_GPU) {
     if (src1->backend == GGML_BACKEND_GPU) {
-        GGML_ASSERT(ggml_are_same_shape(src0, src1));
+        // TODO: OpenCL kernel support full broadcast
+        GGML_ASSERT(ggml_can_repeat_rows(src1, src0));
         if (ith == 0) {
         if (ith == 0) {
             ggml_cl_mul(src0, src1, dst);
             ggml_cl_mul(src0, src1, dst);
         }
         }