sampling_ext.cpp 2.2 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667
  1. // TODO: this is a temporary wrapper to allow calling C++ code from CGo
  2. #include "sampling.h"
  3. #include "sampling_ext.h"
  4. #include "json-schema-to-grammar.h"
  5. struct common_sampler *common_sampler_cinit(const struct llama_model *model, struct common_sampler_cparams *params) {
  6. try {
  7. common_params_sampling sparams;
  8. sparams.top_k = params->top_k;
  9. sparams.top_p = params->top_p;
  10. sparams.min_p = params->min_p;
  11. sparams.typ_p = params->typical_p;
  12. sparams.temp = params->temp;
  13. sparams.penalty_last_n = params->penalty_last_n;
  14. sparams.penalty_repeat = params->penalty_repeat;
  15. sparams.penalty_freq = params->penalty_freq;
  16. sparams.penalty_present = params->penalty_present;
  17. sparams.mirostat = params->mirostat;
  18. sparams.mirostat_tau = params->mirostat_tau;
  19. sparams.mirostat_eta = params->mirostat_eta;
  20. sparams.penalize_nl = params->penalize_nl;
  21. sparams.seed = params->seed;
  22. sparams.grammar = params->grammar;
  23. sparams.xtc_probability = 0.0;
  24. sparams.xtc_threshold = 0.5;
  25. return common_sampler_init(model, sparams);
  26. } catch (const std::exception &err) {
  27. return nullptr;
  28. }
  29. }
  30. void common_sampler_cfree(struct common_sampler *sampler) {
  31. common_sampler_free(sampler);
  32. }
  33. void common_sampler_creset(struct common_sampler *sampler) {
  34. common_sampler_reset(sampler);
  35. }
  36. void common_sampler_caccept(struct common_sampler *sampler, llama_token id, bool apply_grammar) {
  37. common_sampler_accept(sampler, id, apply_grammar);
  38. }
  39. llama_token common_sampler_csample(struct common_sampler *sampler, struct llama_context *ctx, int idx) {
  40. return common_sampler_sample(sampler, ctx, idx);
  41. }
  42. int schema_to_grammar(const char *json_schema, char *grammar, size_t max_len)
  43. {
  44. try
  45. {
  46. nlohmann::json schema = nlohmann::json::parse(json_schema);
  47. std::string grammar_str = json_schema_to_grammar(schema);
  48. size_t len = grammar_str.length();
  49. if (len >= max_len)
  50. {
  51. len = max_len - 1;
  52. }
  53. strncpy(grammar, grammar_str.c_str(), len);
  54. return len;
  55. }
  56. catch (const std::exception &e)
  57. {
  58. strncpy(grammar, "", max_len - 1);
  59. return 0;
  60. }
  61. }