pushdown_runner.go 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147
  1. package sample
  2. import (
  3. "fmt"
  4. "math"
  5. "github.com/ollama/ollama/model"
  6. )
  7. type PushdownSampler struct {
  8. // stateful
  9. curNode *PDANode
  10. proc model.TextProcessor
  11. stateToNodeMap map[JSONState]*PDANode
  12. braceStack []rune
  13. }
  14. func NewPushdownSampler(proc model.TextProcessor) *PushdownSampler {
  15. startNode, stateToNodeMap, err := BuildGraph(proc)
  16. if err != nil {
  17. panic(err)
  18. }
  19. err = PreComputeValidStates(stateToNodeMap, proc)
  20. if err != nil {
  21. panic(err)
  22. }
  23. // for id, node := range stateToNodeMap[StateInComma].MaskTokenIDToNode {
  24. // token, err := proc.Decode([]int32{int32(id)})
  25. // if err != nil {
  26. // panic(err)
  27. // }
  28. // fmt.Println("id", id, "node", node, "token", token)
  29. // }
  30. // time.Sleep(10 * time.Second)
  31. return &PushdownSampler{
  32. curNode: startNode,
  33. proc: proc,
  34. stateToNodeMap: stateToNodeMap,
  35. braceStack: []rune{},
  36. }
  37. }
  38. func (s *PushdownSampler) Sample(logits []float64) ([]float64, error) {
  39. fmt.Println("sample:", s.curNode.State)
  40. switch s.curNode.State {
  41. case StateInObjectEnd:
  42. // force finish if no braces left
  43. if len(s.braceStack) == 0 {
  44. s.curNode = NewPDANode(StateTerminate)
  45. for i := range logits {
  46. if s.proc.Is(uint32(i), model.SpecialEOS) {
  47. logits[i] = 1.0
  48. } else {
  49. logits[i] = math.NaN()
  50. }
  51. }
  52. return logits, nil
  53. }
  54. valid, err := s.proc.Encode("}")
  55. if err != nil {
  56. return nil, err
  57. }
  58. for i := range logits {
  59. for _, token := range valid {
  60. if i != int(token) {
  61. logits[i] = math.NaN()
  62. }
  63. }
  64. }
  65. return logits, nil
  66. // return logits, nil
  67. case StateTerminate:
  68. for i := range logits {
  69. if s.proc.Is(uint32(i), model.SpecialEOS) {
  70. logits[i] = 1.0
  71. } else {
  72. logits[i] = math.NaN()
  73. }
  74. }
  75. return logits, nil
  76. // case StateInStringEnd:
  77. // return logits, nil
  78. default:
  79. fmt.Println("masking logits current state", s.curNode.State)
  80. logits, err := s.maskLogits(logits, s.curNode)
  81. if err != nil {
  82. return nil, err
  83. }
  84. return logits, nil
  85. }
  86. }
  87. func (s *PushdownSampler) UpdateState(tokenSlice []int32) error {
  88. fmt.Println("update state", s.curNode.State)
  89. // TODO: need to handle end states and entering object case
  90. if s.curNode.State == StateInObjectEnd {
  91. fmt.Println("in object end")
  92. if len(s.braceStack) > 0 {
  93. s.braceStack = s.braceStack[:len(s.braceStack)-1]
  94. return nil
  95. }
  96. s.curNode = NewPDANode(StateTerminate)
  97. // TODO: return here?
  98. }
  99. // need this cause there could be multiple transitions
  100. mappedString, err := s.proc.Decode(tokenSlice)
  101. if err != nil {
  102. return err
  103. }
  104. for _, r := range mappedString {
  105. if r == rune('{') {
  106. s.braceStack = append(s.braceStack, r)
  107. }
  108. if r == rune('}') {
  109. if len(s.braceStack) == 0 || s.braceStack[len(s.braceStack)-1] != rune('{') {
  110. return fmt.Errorf("unmatched closing brace")
  111. }
  112. s.braceStack = s.braceStack[:len(s.braceStack)-1]
  113. }
  114. }
  115. for _, tokenID := range tokenSlice {
  116. // transition to the next node
  117. nextNode, ok := s.curNode.MaskTokenIDToNode[tokenID]
  118. if !ok {
  119. return fmt.Errorf("invalid token: %q", mappedString)
  120. }
  121. fmt.Println("transitioning to", nextNode)
  122. s.curNode = s.stateToNodeMap[nextNode]
  123. }
  124. return nil
  125. }
  126. func (s *PushdownSampler) maskLogits(logits []float64, node *PDANode) ([]float64, error) {
  127. for i := range logits {
  128. _, exists := node.MaskTokenIDToNode[int32(i)]
  129. if !exists {
  130. logits[i] = math.NaN()
  131. }
  132. }
  133. return logits, nil
  134. }
  135. // TODO: add penalties for string \n stuff