| 12345678910111213141516171819202122232425 |
- #pragma once
- #include "../llama-model.h"
- #include "../llama-graph.h"
- #include <cmath>
- struct llm_build_granite : public llm_graph_context {
- llm_build_granite(const llama_model & model, const llm_graph_params & params);
- private:
- ggml_tensor * build_attention_layer(
- ggml_tensor * cur,
- ggml_tensor * inp_pos,
- llm_graph_input_attn_kv * inp_attn,
- const llama_model & model,
- const int64_t n_embd_head,
- const int il);
- ggml_tensor * build_layer_ffn(
- ggml_tensor * cur,
- ggml_tensor * inpSA,
- const llama_model & model,
- const int il);
- };
|