|
|
@@ -7759,10 +7759,10 @@ static void ggml_compute_forward_mul_f32(
|
|
|
const int ith = params->ith;
|
|
|
const int nth = params->nth;
|
|
|
|
|
|
-// TODO: OpenCL kernel support broadcast
|
|
|
#ifdef GGML_USE_CLBLAST
|
|
|
if (src1->backend == GGML_BACKEND_GPU) {
|
|
|
- GGML_ASSERT(ggml_are_same_shape(src0, src1));
|
|
|
+ // TODO: OpenCL kernel support full broadcast
|
|
|
+ GGML_ASSERT(ggml_can_repeat_rows(src1, src0));
|
|
|
if (ith == 0) {
|
|
|
ggml_cl_mul(src0, src1, dst);
|
|
|
}
|