|
|
// by doing so, the number of splits in the graph is reduced
|
|
// by doing so, the number of splits in the graph is reduced
|
|
|
ggml_build_forward_expand(graph, k_cur);
|
|
ggml_build_forward_expand(graph, k_cur);
|
|
|
ggml_build_forward_expand(graph, v_cur);
|
|
ggml_build_forward_expand(graph, v_cur);
|
|
|
llm_build_kv_store(ctx, hparams, kv, graph, k_cur, v_cur, n_ctx, n_tokens, kv_head, cb, il);
|
|
llm_build_kv_store(ctx, hparams, kv, graph, k_cur, v_cur, n_ctx, n_tokens, kv_head, cb, il);
|