binding.h 1.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748
  1. #ifdef __cplusplus
  2. #include <string>
  3. #include <vector>
  4. extern "C" {
  5. #endif
  6. #include <stdbool.h>
  // Callback declared here but defined elsewhere (hence `extern`); it takes an
  // opaque pointer and a mutable C string and returns an unsigned char.
  // NOTE(review): presumably invoked once per generated token with the model
  // state and the token text, the return value acting as a continue/stop flag
  // -- confirm against the definition.
  7. extern unsigned char tokenCallback(void *, char *);
  // Declares load_state(ctx, statefile, modes) -> int.
  // `ctx` is an opaque pointer; `statefile` and `modes` are C strings.
  // NOTE(review): presumably `statefile` is a path, `modes` an fopen-style mode
  // string, and the int a status code -- verify in the implementation.
  8. int load_state(void *ctx, char *statefile, char *modes);
  // Declares eval(params_ptr, ctx, text) -> int.
  // Both pointer arguments are opaque (`void *`); `text` is a C string.
  // NOTE(review): presumably `params_ptr` comes from llama_allocate_params and
  // `ctx` from load_model, and the int is a status code -- TODO confirm.
  9. int eval(void *params_ptr, void *ctx, char *text);
  // Declares save_state(ctx, dst, modes); returns nothing, so any failure is
  // not reported through the return value.
  // NOTE(review): presumably the counterpart of load_state, with `dst` the
  // destination path and `modes` an fopen-style mode string -- verify.
  10. void save_state(void *ctx, char *dst, char *modes);
  // Declares load_model, which returns an opaque `void *`.
  // Inputs: a C string `fname`; integer settings n_ctx, n_seed, n_gpu, n_batch;
  // boolean switches memory_f16, mlock, embeddings, mmap, low_vram, vocab_only,
  // numa; and two C strings `maingpu` and `tensorsplit`.
  // NOTE(review): presumably `fname` is the model file path, the returned
  // pointer is the state/ctx handle taken by the other functions here, it is
  // released with llama_binding_free_model, and a null return signals
  // failure -- confirm against the implementation.
  11. void *load_model(const char *fname, int n_ctx, int n_seed, bool memory_f16,
  12. bool mlock, bool embeddings, bool mmap, bool low_vram,
  13. bool vocab_only, int n_gpu, int n_batch, const char *maingpu,
  14. const char *tensorsplit, bool numa);
  // Declares get_embeddings(params_ptr, state_pr, res_embeddings) -> int.
  // `res_embeddings` is a non-const float pointer.
  // NOTE(review): presumably a caller-allocated output buffer; its required
  // length is not expressed in this signature -- verify before sizing it.
  // NOTE(review): `state_pr` looks like a typo for `state_ptr`.
  15. int get_embeddings(void *params_ptr, void *state_pr, float *res_embeddings);
  // Declares get_token_embeddings -> int.
  // Takes two opaque pointers, an int array `tokens` with its element count
  // `tokenSize`, and a non-const float pointer `res_embeddings`.
  // NOTE(review): presumably `res_embeddings` is a caller-allocated output
  // buffer and `tokens` holds token ids -- confirm sizes and meaning in the
  // implementation.
  16. int get_token_embeddings(void *params_ptr, void *state_pr, int *tokens,
  17. int tokenSize, float *res_embeddings);
  // Declares llama_allocate_params, which returns an opaque `void *`.
  // Inputs, as named in the signature:
  //   - prompt, logit_bias, maingpu, tensorsplit: C strings
  //   - antiprompt / antiprompt_count: array of C strings and its length
  //   - seed, threads, tokens, top_k, repeat_last_n, n_batch, n_keep,
  //     mirostat: integers
  //   - top_p, temp, repeat_penalty, tfs_z, typical_p, frequency_penalty,
  //     presence_penalty, mirostat_eta, mirostat_tau: floats
  //   - ignore_eos, memory_f16, penalize_nl, mlock, mmap: booleans
  // NOTE(review): presumably the returned pointer is the `params_ptr` the
  // other functions accept and must be released with llama_free_params --
  // confirm. Many adjacent parameters share a type, so swapped arguments will
  // not be caught by the compiler.
  18. void *llama_allocate_params(
  19. const char *prompt, int seed, int threads, int tokens, int top_k,
  20. float top_p, float temp, float repeat_penalty, int repeat_last_n,
  21. bool ignore_eos, bool memory_f16, int n_batch, int n_keep,
  22. const char **antiprompt, int antiprompt_count, float tfs_z, float typical_p,
  23. float frequency_penalty, float presence_penalty, int mirostat,
  24. float mirostat_eta, float mirostat_tau, bool penalize_nl,
  25. const char *logit_bias, bool mlock, bool mmap, const char *maingpu,
  26. const char *tensorsplit);
  // Declares llama_free_params(params_ptr); takes an opaque pointer and
  // returns nothing.
  // NOTE(review): presumably releases a pointer obtained from
  // llama_allocate_params; behaviour for null or already-freed pointers is not
  // visible here -- verify.
  27. void llama_free_params(void *params_ptr);
  // Declares llama_binding_free_model(state); takes an opaque pointer and
  // returns nothing.
  // NOTE(review): presumably releases the handle returned by load_model --
  // confirm against the implementation.
  28. void llama_binding_free_model(void *state);
  // Declares llama_predict(params_ptr, state_pr, result, debug) -> int.
  // `result` is a non-const char pointer and `debug` a boolean switch.
  // NOTE(review): presumably `result` is a caller-allocated buffer that
  // receives the generated text; no capacity is passed, so the required size
  // must be learned from the implementation -- TODO confirm.
  29. int llama_predict(void *params_ptr, void *state_pr, char *result, bool debug);
  30. #ifdef __cplusplus
  31. }
  // C++-only helper: declared inside the `__cplusplus` guard and after the
  // extern "C" block is closed, so it is not visible to C callers.
  // Takes an array of C strings plus a count and returns a
  // std::vector<std::string> by value.
  // NOTE(review): presumably copies the first `count` entries of `strings` --
  // confirm.
  32. std::vector<std::string> create_vector(const char **strings, int count);
  // C++-only helper taking a pointer to a std::vector<std::string>.
  // NOTE(review): the name suggests it destroys/deallocates the vector, but
  // create_vector returns by value rather than by pointer -- confirm which
  // allocation this is meant to pair with before calling it.
  33. void delete_vector(std::vector<std::string> *vec);
  34. #endif