|
|
@@ -496,7 +496,7 @@ ggml_tensor * llm_build_qwen3next::build_qwen3next_linear_attn_layer(llm_graph_i
|
|
|
cb(conv_input, "conv_input", il);
|
|
|
|
|
|
// Apply convolution
|
|
|
- ggml_tensor * conv_output = ggml_conv_1d_dw_f32(ctx0, conv_kernel, conv_input, 1, conv_kernel_size - 1, n_seqs);
|
|
|
+ ggml_tensor * conv_output = ggml_conv_1d_dw_f32(ctx0, conv_kernel, conv_input, 1, conv_kernel_size - 1, 1);
|
|
|
cb(conv_output, "conv_output_raw", il);
|
|
|
|
|
|
// Remove the padding
|