// llm_build_granite.h
  1. #pragma once
  2. #include "../llama-model.h"
  3. #include "../llama-graph.h"
  4. #include <cmath>
  5. struct llm_build_granite : public llm_graph_context {
  6. llm_build_granite(const llama_model & model, const llm_graph_params & params);
  7. private:
  8. ggml_tensor * build_attention_layer(
  9. ggml_tensor * cur,
  10. ggml_tensor * inp_pos,
  11. llm_graph_input_attn_kv * inp_attn,
  12. const llama_model & model,
  13. const int64_t n_embd_head,
  14. const int il);
  15. ggml_tensor * build_layer_ffn(
  16. ggml_tensor * cur,
  17. ggml_tensor * inpSA,
  18. const llama_model & model,
  19. const int il);
  20. };