01-cache.diff 576 B

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
  1. diff --git a/examples/server/server.cpp b/examples/server/server.cpp
  2. index f255ad76..914ecfdd 100644
  3. --- a/examples/server/server.cpp
  4. +++ b/examples/server/server.cpp
  5. @@ -1101,12 +1101,13 @@ struct server_context {
  6. // add the token to slot queue and cache
  7. }
  8. - slot.add_token_string(result);
  9. if (slot.params.stream) {
  10. send_partial_response(slot, result);
  11. }
  12. }
  13. + slot.add_token_string(result);
  14. +
  15. if (incomplete) {
  16. slot.has_next_token = true;
  17. }