pushdown_automata.go 8.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296
  1. package sample
  2. import (
  3. "slices"
  4. "github.com/ollama/ollama/model"
  5. )
  6. var stringInvalidRunes = []rune{'\\', '\n', '\t', '{', '}', ':', ','}
  7. var intInvalidRunes = []rune{'e', 'E', ' ', '\n', '\t', '{', '}', ':', ',', '"'}
  8. var validIntRunes = []rune{'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '-'}
  9. var validNumberRunes = []rune{'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '.', '-', '+', 'e', 'E'}
  10. var validBoolRunes = []rune{'t', 'r', 'u', 'e', 'f', 'a', 'l', 's', 'e'}
  11. var validNullRunes = []rune{'n', 'u', 'l', 'l'}
  12. type PDANode struct {
  13. State JSONState
  14. TransitionEdges map[rune]*PDANode
  15. MaskTokenIDToNode map[int32]JSONState
  16. }
  17. func NewPDANode(state JSONState) *PDANode {
  18. return &PDANode{
  19. State: state,
  20. TransitionEdges: make(map[rune]*PDANode),
  21. MaskTokenIDToNode: make(map[int32]JSONState),
  22. }
  23. }
  24. func BuildGraph(proc model.TextProcessor) (*PDANode, map[JSONState]*PDANode, error) {
  25. stateToNodeMap := make(map[JSONState]*PDANode)
  26. startNode := NewPDANode(StateStart)
  27. stateToNodeMap[StateStart] = startNode
  28. objNode := NewPDANode(StateInObject)
  29. stateToNodeMap[StateInObject] = objNode
  30. objEndNode := NewPDANode(StateInObjectEnd)
  31. stateToNodeMap[StateInObjectEnd] = objEndNode
  32. objKeyNode := NewPDANode(StateInObjectKey)
  33. stateToNodeMap[StateInObjectKey] = objKeyNode
  34. objKeyEndNode := NewPDANode(StateInObjectKeyEnd)
  35. stateToNodeMap[StateInObjectKeyEnd] = objKeyEndNode
  36. colonNode := NewPDANode(StateInColon)
  37. stateToNodeMap[StateInColon] = colonNode
  38. commaNode := NewPDANode(StateInComma)
  39. stateToNodeMap[StateInComma] = commaNode
  40. newlineNode := NewPDANode(StateInNewline)
  41. stateToNodeMap[StateInNewline] = newlineNode
  42. spaceNode := NewPDANode(StateInSpace)
  43. stateToNodeMap[StateInSpace] = spaceNode
  44. spaceObjNode := NewPDANode(StateInObjSpace)
  45. stateToNodeMap[StateInObjSpace] = spaceObjNode
  46. tabNode := NewPDANode(StateInTab)
  47. stateToNodeMap[StateInTab] = tabNode
  48. stringNode := NewPDANode(StateInString)
  49. stateToNodeMap[StateInString] = stringNode
  50. stringEndNode := NewPDANode(StateInStringEnd)
  51. stateToNodeMap[StateInStringEnd] = stringEndNode
  52. listNode := NewPDANode(StateInList)
  53. stateToNodeMap[StateInList] = listNode
  54. listCommaNode := NewPDANode(StateInListComma)
  55. stateToNodeMap[StateInListComma] = listCommaNode
  56. listEndNode := NewPDANode(StateListEnd)
  57. stateToNodeMap[StateListEnd] = listEndNode
  58. numberNode := NewPDANode(StateInNumber)
  59. stateToNodeMap[StateInNumber] = numberNode
  60. boolNode := NewPDANode(StateInBool)
  61. stateToNodeMap[StateInBool] = boolNode
  62. nullNode := NewPDANode(StateInNull)
  63. stateToNodeMap[StateInNull] = nullNode
  64. // Defined with structured outputs only
  65. intNode := NewPDANode(StateInInt)
  66. stateToNodeMap[StateInInt] = intNode
  67. // TODO:
  68. // consider adding a node to just point to values, could be good to compute that
  69. // mask rather than many different nodes
  70. // Connect nodes
  71. // TODO: if all are single tokens then this can just be connected instead of defining the token
  72. startNode.TransitionEdges['{'] = objNode
  73. objNode.TransitionEdges['"'] = objKeyNode
  74. objNode.TransitionEdges['\n'] = newlineNode
  75. // objNode.TransitionEdges['\t'] = tabNode
  76. newlineNode.TransitionEdges['"'] = objKeyNode
  77. newlineNode.TransitionEdges['\t'] = tabNode
  78. tabNode.TransitionEdges['"'] = objKeyNode
  79. // tabNode.TransitionEdges['\t'] = tabNode
  80. objKeyNode.TransitionEdges[rune(-1)] = objKeyNode
  81. objKeyNode.TransitionEdges['"'] = objKeyEndNode
  82. objKeyEndNode.TransitionEdges[':'] = colonNode
  83. objEndNode.TransitionEdges[' '] = spaceNode
  84. // where values should be
  85. // this could be combined but the probs might change, we're alr doing a skip ahead
  86. colonNode.TransitionEdges[' '] = spaceNode
  87. // Leads to a value
  88. spaceNode.TransitionEdges['"'] = stringNode
  89. spaceNode.TransitionEdges['['] = listNode
  90. spaceNode.TransitionEdges['{'] = objNode
  91. for _, r := range validNumberRunes {
  92. spaceNode.TransitionEdges[r] = numberNode
  93. }
  94. for _, r := range validBoolRunes {
  95. spaceNode.TransitionEdges[r] = boolNode
  96. }
  97. for _, r := range validNullRunes {
  98. spaceNode.TransitionEdges[r] = nullNode
  99. }
  100. // Values
  101. // string node
  102. stringNode.TransitionEdges[rune(-1)] = stringNode
  103. stringNode.TransitionEdges['"'] = stringEndNode
  104. stringEndNode.TransitionEdges[','] = commaNode
  105. stringEndNode.TransitionEdges['}'] = objEndNode
  106. stringEndNode.TransitionEdges[']'] = listEndNode
  107. // TODO: add counters for allowable number of decimals, e, E, etc
  108. // number node
  109. for _, r := range validNumberRunes {
  110. numberNode.TransitionEdges[r] = numberNode
  111. }
  112. numberNode.TransitionEdges[','] = commaNode
  113. numberNode.TransitionEdges['}'] = objEndNode
  114. numberNode.TransitionEdges[']'] = listEndNode
  115. for _, r := range validBoolRunes {
  116. boolNode.TransitionEdges[r] = boolNode
  117. }
  118. // list node
  119. listNode.TransitionEdges[','] = commaNode
  120. listNode.TransitionEdges['"'] = stringNode
  121. // squash states to a value
  122. for _, r := range validNumberRunes {
  123. listNode.TransitionEdges[r] = numberNode
  124. }
  125. for _, r := range validBoolRunes {
  126. listNode.TransitionEdges[r] = boolNode
  127. }
  128. for _, r := range validNullRunes {
  129. listNode.TransitionEdges[r] = nullNode
  130. }
  131. // null node
  132. for _, r := range validNullRunes {
  133. nullNode.TransitionEdges[r] = nullNode
  134. }
  135. nullNode.TransitionEdges[','] = commaNode
  136. nullNode.TransitionEdges['}'] = objEndNode
  137. nullNode.TransitionEdges[']'] = listEndNode
  138. // list comma
  139. // should point to values
  140. listCommaNode.TransitionEdges['"'] = stringNode
  141. listCommaNode.TransitionEdges[' '] = listCommaNode
  142. listCommaNode.TransitionEdges['{'] = objNode
  143. listCommaNode.TransitionEdges['\n'] = newlineNode
  144. for _, r := range validNumberRunes {
  145. listCommaNode.TransitionEdges[r] = numberNode
  146. }
  147. for _, r := range validBoolRunes {
  148. listCommaNode.TransitionEdges[r] = boolNode
  149. }
  150. for _, r := range validNullRunes {
  151. listCommaNode.TransitionEdges[r] = nullNode
  152. }
  153. // bool node
  154. for _, r := range validBoolRunes {
  155. boolNode.TransitionEdges[r] = boolNode
  156. }
  157. boolNode.TransitionEdges['}'] = objEndNode
  158. boolNode.TransitionEdges[']'] = listEndNode
  159. boolNode.TransitionEdges[','] = commaNode
  160. listEndNode.TransitionEdges['}'] = objEndNode
  161. listEndNode.TransitionEdges[','] = commaNode
  162. commaNode.TransitionEdges['{'] = objNode
  163. commaNode.TransitionEdges['\n'] = newlineNode
  164. commaNode.TransitionEdges['\t'] = tabNode
  165. commaNode.TransitionEdges['"'] = objKeyNode
  166. commaNode.TransitionEdges[' '] = spaceObjNode
  167. spaceObjNode.TransitionEdges['"'] = objKeyNode
  168. return startNode, stateToNodeMap, nil
  169. }
  170. func PreComputeValidStates(stateToNodeMap map[JSONState]*PDANode, proc model.TextProcessor) error {
  171. vocab := proc.GetVocabulary()
  172. decodedToks := make([]string, len(vocab.Values))
  173. for i := range vocab.Values {
  174. token, err := proc.Decode([]int32{int32(i)})
  175. if err != nil {
  176. return err
  177. }
  178. decodedToks[i] = token
  179. }
  180. var err error
  181. for _, node := range stateToNodeMap {
  182. for i := range vocab.Values {
  183. token := decodedToks[i]
  184. // Skip EOS/BOS tokens and empty tokens since they are not valid in JSON
  185. if proc.Is(uint32(i), model.SpecialEOS) || proc.Is(uint32(i), model.SpecialBOS) || token == "" {
  186. continue
  187. }
  188. valid := true
  189. curNode := node
  190. consumedSpecialRunes := make(map[rune]bool)
  191. for _, r := range token {
  192. valid, curNode, err = isRuneValid(r, curNode, consumedSpecialRunes)
  193. if err != nil {
  194. return err
  195. }
  196. if !valid {
  197. break
  198. }
  199. }
  200. if valid {
  201. node.MaskTokenIDToNode[int32(i)] = curNode.State
  202. }
  203. }
  204. }
  205. return nil
  206. }
  207. func isRuneValid(r rune, curNode *PDANode, consumedSpecialRunes map[rune]bool) (bool, *PDANode, error) {
  208. if consumedSpecialRunes[r] {
  209. return false, nil, nil
  210. }
  211. specialRune := slices.Contains(stringInvalidRunes, r)
  212. if specialRune {
  213. if curNode.State == StateInString || curNode.State == StateInObjectKey {
  214. return false, nil, nil
  215. }
  216. }
  217. // Check for specific rune transition
  218. if nextNode, ok := curNode.TransitionEdges[r]; ok {
  219. if specialRune {
  220. if curNode.State == nextNode.State {
  221. return false, nil, nil
  222. }
  223. // fmt.Println("special rune", r, "consumed")
  224. consumedSpecialRunes[r] = true
  225. }
  226. return true, nextNode, nil
  227. }
  228. // Check for sentinel value - if present, any rune is valid
  229. if nextNode, ok := curNode.TransitionEdges[rune(-1)]; ok {
  230. return true, nextNode, nil
  231. }
  232. return false, nil, nil
  233. }