ggml-rpc.h 1.1 KB

1234567891011121314151617181920212223242526272829303132
  1. #pragma once
  2. #include "ggml.h"
  3. #include "ggml-backend.h"
  4. #ifdef __cplusplus
  5. extern "C" {
  6. #endif
  // RPC protocol version, split into major / minor / patch components
  // (3.0.0 as declared here).
  // NOTE(review): presumably the two ends of an RPC connection compare these
  // values to detect incompatible peers - confirm against the implementation.
  7. #define RPC_PROTO_MAJOR_VERSION 3
  8. #define RPC_PROTO_MINOR_VERSION 0
  9. #define RPC_PROTO_PATCH_VERSION 0
  // Named limit of 16 RPC servers.
  // NOTE(review): where and how this cap is enforced is not visible in this
  // header - confirm against the implementation.
  10. #define GGML_RPC_MAX_SERVERS 16
  11. // backend API
  // Declares the RPC backend initializer.
  //   endpoint - C string naming the RPC server to use
  //              (NOTE(review): presumably "host:port" - confirm the format).
  //   device   - 32-bit unsigned device selector
  //              (presumably an index of a device exposed by that server - confirm).
  // Returns a ggml_backend_t handle. Failure behavior (e.g. a NULL return) is
  // not specified in this header - TODO confirm.
  12. GGML_BACKEND_API ggml_backend_t ggml_backend_rpc_init(const char * endpoint, uint32_t device);
  // Declares a predicate over a backend handle.
  //   backend - the backend handle to inspect.
  // Returns a bool; presumably true when `backend` is an RPC backend
  // (inferred from the name - confirm against the implementation).
  13. GGML_BACKEND_API bool ggml_backend_is_rpc(ggml_backend_t backend);
  // Declares an accessor that yields a buffer type for an endpoint/device pair.
  //   endpoint - C string naming the RPC server (format not specified here).
  //   device   - 32-bit unsigned device selector
  //              (presumably a device index on that server - confirm).
  // Returns a ggml_backend_buffer_type_t. Ownership and lifetime of the
  // returned handle are not specified in this header - TODO confirm.
  14. GGML_BACKEND_API ggml_backend_buffer_type_t ggml_backend_rpc_buffer_type(const char * endpoint, uint32_t device);
  // Declares a memory query for an endpoint/device pair. Nothing is returned
  // directly; results are passed through the two pointer parameters.
  //   endpoint - C string naming the RPC server (format not specified here).
  //   device   - 32-bit unsigned device selector.
  //   free     - non-const size_t pointer; presumably receives the free memory
  //              of the device (units presumably bytes - confirm).
  //   total    - non-const size_t pointer; presumably receives the total
  //              memory of the device (units presumably bytes - confirm).
  // NOTE(review): whether NULL is accepted for `free` / `total` is not visible
  // here - confirm before passing NULL.
  15. GGML_BACKEND_API void ggml_backend_rpc_get_device_memory(const char * endpoint, uint32_t device, size_t * free, size_t * total);
  // Declares the entry point that starts an RPC server. Returns nothing.
  //   endpoint  - C string naming the address to serve on
  //               (format not specified here - confirm).
  //   cache_dir - C string naming a cache directory
  //               (NOTE(review): whether NULL disables caching is not visible
  //               here - confirm).
  //   n_threads - thread count (how it is used is not visible here).
  //   n_devices - device count; presumably the number of entries in
  //               `devices`, `free_mem` and `total_mem` - confirm.
  //   devices   - pointer to ggml_backend_dev_t handles.
  //   free_mem  - pointer to size_t values (presumably per-device free memory).
  //   total_mem - pointer to size_t values (presumably per-device total memory).
  // NOTE(review): whether this call blocks for the lifetime of the server is
  // not specified in this header - confirm against the implementation.
  16. GGML_BACKEND_API void ggml_backend_rpc_start_server(const char * endpoint, const char * cache_dir,
  17. size_t n_threads, size_t n_devices,
  18. ggml_backend_dev_t * devices, size_t * free_mem, size_t * total_mem);
  // Declares a parameterless accessor returning a ggml_backend_reg_t.
  // NOTE(review): presumably this is the registry object for the RPC backend
  // (inferred from the name) - confirm against the implementation.
  19. GGML_BACKEND_API ggml_backend_reg_t ggml_backend_rpc_reg(void);
  // Declares a function that takes a server endpoint and returns a
  // ggml_backend_reg_t.
  //   endpoint - C string naming the RPC server to add
  //              (format not specified here - confirm).
  // NOTE(review): how the returned registry relates to the one from
  // ggml_backend_rpc_reg(), and what is returned on failure, are not visible
  // in this header - confirm against the implementation.
  20. GGML_BACKEND_API ggml_backend_reg_t ggml_backend_rpc_add_server(const char * endpoint);
  21. #ifdef __cplusplus
  22. }
  23. #endif