sampling_ext.cpp 2.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081
  1. // TODO: this is a temporary wrapper to allow calling C++ code from CGo
  2. #include "sampling.h"
  3. #include "sampling_ext.h"
  4. #include "json-schema-to-grammar.h"
  5. struct gpt_sampler *gpt_sampler_cinit(
  6. const struct llama_model *model, struct gpt_sampler_cparams *params)
  7. {
  8. try
  9. {
  10. gpt_sampler_params sparams;
  11. sparams.top_k = params->top_k;
  12. sparams.top_p = params->top_p;
  13. sparams.min_p = params->min_p;
  14. sparams.tfs_z = params->tfs_z;
  15. sparams.typ_p = params->typical_p;
  16. sparams.temp = params->temp;
  17. sparams.penalty_last_n = params->penalty_last_n;
  18. sparams.penalty_repeat = params->penalty_repeat;
  19. sparams.penalty_freq = params->penalty_freq;
  20. sparams.penalty_present = params->penalty_present;
  21. sparams.mirostat = params->mirostat;
  22. sparams.mirostat_tau = params->mirostat_tau;
  23. sparams.mirostat_eta = params->mirostat_eta;
  24. sparams.penalize_nl = params->penalize_nl;
  25. sparams.seed = params->seed;
  26. sparams.grammar = params->grammar;
  27. return gpt_sampler_init(model, sparams);
  28. }
  29. catch (const std::exception &err)
  30. {
  31. return nullptr;
  32. }
  33. }
  34. void gpt_sampler_cfree(struct gpt_sampler *sampler)
  35. {
  36. gpt_sampler_free(sampler);
  37. }
  38. void gpt_sampler_creset(struct gpt_sampler *sampler)
  39. {
  40. gpt_sampler_reset(sampler);
  41. }
  42. llama_token gpt_sampler_csample(
  43. struct gpt_sampler *sampler,
  44. struct llama_context *ctx_main,
  45. int idx)
  46. {
  47. return gpt_sampler_sample(sampler, ctx_main, idx);
  48. }
  49. void gpt_sampler_caccept(
  50. struct gpt_sampler *sampler,
  51. llama_token id,
  52. bool apply_grammar)
  53. {
  54. gpt_sampler_accept(sampler, id, apply_grammar);
  55. }
  56. int schema_to_grammar(const char *json_schema, char *grammar, size_t max_len)
  57. {
  58. try
  59. {
  60. nlohmann::json schema = nlohmann::json::parse(json_schema);
  61. std::string grammar_str = json_schema_to_grammar(schema);
  62. size_t len = grammar_str.length();
  63. if (len >= max_len)
  64. {
  65. len = max_len - 1;
  66. }
  67. strncpy(grammar, grammar_str.c_str(), len);
  68. return len;
  69. }
  70. catch (const std::exception &e)
  71. {
  72. strncpy(grammar, "", max_len - 1);
  73. return 0;
  74. }
  75. }