// ggml-rpc.h
  1. #pragma once
  2. #include "ggml.h"
  3. #include "ggml-backend.h"
  4. #ifdef __cplusplus
  5. extern "C" {
  6. #endif
  7. #define RPC_PROTO_MAJOR_VERSION 3
  8. #define RPC_PROTO_MINOR_VERSION 0
  9. #define RPC_PROTO_PATCH_VERSION 0
  10. #define GGML_RPC_MAX_SERVERS 16
  11. // backend API
  12. GGML_BACKEND_API ggml_backend_t ggml_backend_rpc_init(const char * endpoint, uint32_t device);
  13. GGML_BACKEND_API bool ggml_backend_is_rpc(ggml_backend_t backend);
  14. GGML_BACKEND_API ggml_backend_buffer_type_t ggml_backend_rpc_buffer_type(const char * endpoint, uint32_t device);
  15. GGML_BACKEND_API void ggml_backend_rpc_get_device_memory(const char * endpoint, uint32_t device, size_t * free, size_t * total);
  16. GGML_BACKEND_API void ggml_backend_rpc_start_server(const char * endpoint, const char * cache_dir,
  17. size_t n_threads, size_t n_devices, ggml_backend_dev_t * devices);
  18. GGML_BACKEND_API ggml_backend_reg_t ggml_backend_rpc_reg(void);
  19. GGML_BACKEND_API ggml_backend_reg_t ggml_backend_rpc_add_server(const char * endpoint);
  20. #ifdef __cplusplus
  21. }
  22. #endif