há 2 anos atrás · 48b24b170e
--- a/ggml.c
+++ b/ggml.c
@@ -15335,6 +15335,8 @@ static void ggml_compute_backward(struct ggml_context * ctx, struct ggml_tensor
 
				                     const int n_past = ((int32_t *) tensor->op_params)[0];
			
 
				                     src0->grad =
			
 
				                         ggml_add_or_set(ctx, src0->grad,
			
 
				+                            /* ggml_diag_mask_inf_impl() shouldn't be here */
			
 
				+                            /* ref:  https://github.com/ggerganov/llama.cpp/pull/4203#discussion_r1412377992 */
			
 
				                             ggml_diag_mask_zero_impl(ctx, tensor->grad, n_past, false),
			
 
				                         zero_table);
			
 
				                 }