pushdown_automata.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282
  1. package sample
  2. import (
  3. "slices"
  4. "github.com/ollama/ollama/model"
  5. )
  6. /*
  7. Key JSON rules to consider:
  8. 1. Whitespace handling:
  9. - Need to handle all valid JSON whitespace characters (\r, spaces between tokens)
  10. - Current code only handles some whitespace cases
  11. 2. Number validation:
  12. - Need proper validation for special number cases like -0
  13. - Should handle .5 style decimals (not valid JSON: a digit is required before the decimal point, so these must be rejected)
  14. - Need limits on scientific notation (e, E)
  15. 3. String escaping:
  16. - Currently marks \ as invalid but should allow escaped sequences:
  17. - \"
  18. - \n
  19. - \u1234 unicode escapes
  20. 4. Empty object/array transitions:
  21. - Direct {} and [] cases could be more explicit
  22. - Need clear transitions for these edge cases
  23. 5. Nested depth limits:
  24. - No protection against excessive nesting
  25. - Could cause stack overflow with deeply nested structures
  26. */
  27. // TODO: / should be valid but an escape character
  28. var stringInvalidRunes = []rune{'\n', '\t', '{', '}', ':', ',', '/'}
  29. var intInvalidRunes = []rune{'e', 'E', ' ', '\n', '\t', '{', '}', ':', ',', '"'}
  30. var validIntRunes = []rune{'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '-'}
  31. var validNumberRunes = []rune{'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '.', '-', '+', 'e', 'E'}
  32. var validBoolRunes = []rune{'t', 'r', 'u', 'e', 'f', 'a', 'l', 's', 'e'}
  33. var validNullRunes = []rune{'n', 'u', 'l', 'l'}
  34. type PDA struct {
  35. State JSONState
  36. TransitionEdges map[rune]*PDA
  37. MaskTokenIDToNode map[int32]*PDA
  38. }
  39. func NewPDANode(state JSONState) *PDA {
  40. return &PDA{
  41. State: state,
  42. TransitionEdges: make(map[rune]*PDA),
  43. MaskTokenIDToNode: make(map[int32]*PDA),
  44. }
  45. }
  46. type PDAGraphBuilder struct {
  47. proc model.TextProcessor
  48. decodedToks []string
  49. stateToNodeMap map[JSONState]*PDA
  50. }
  51. func (b *PDAGraphBuilder) BuildGraph() error {
  52. stateToNodeMap := make(map[JSONState]*PDA)
  53. for _, state := range JSONStates {
  54. stateToNodeMap[state] = NewPDANode(state)
  55. }
  56. stateToNodeMap[StateStart].TransitionEdges['{'] = stateToNodeMap[StateInObject]
  57. stateToNodeMap[StateStart].TransitionEdges['['] = stateToNodeMap[StateInList]
  58. stateToNodeMap[StateInObject].TransitionEdges['"'] = stateToNodeMap[StateInObjectKey]
  59. stateToNodeMap[StateInObject].TransitionEdges['\n'] = stateToNodeMap[StateInNewline]
  60. stateToNodeMap[StateInObject].TransitionEdges[' '] = stateToNodeMap[StateInObjSpace]
  61. // new line
  62. stateToNodeMap[StateInNewline].TransitionEdges['"'] = stateToNodeMap[StateInObjectKey]
  63. stateToNodeMap[StateInNewline].TransitionEdges['\t'] = stateToNodeMap[StateInTab]
  64. stateToNodeMap[StateInNewline].TransitionEdges['}'] = stateToNodeMap[StateInObjectEnd]
  65. stateToNodeMap[StateInNewline].TransitionEdges[' '] = stateToNodeMap[StateInObjSpace]
  66. // new line end value
  67. stateToNodeMap[StateInNewlineEndValue].TransitionEdges[' '] = stateToNodeMap[StateInSpaceEndValue]
  68. stateToNodeMap[StateInNewlineEndValue].TransitionEdges['}'] = stateToNodeMap[StateInObjectEnd]
  69. stateToNodeMap[StateInNewlineEndValue].TransitionEdges[']'] = stateToNodeMap[StateInListEnd]
  70. stateToNodeMap[StateInObjSpace].TransitionEdges['"'] = stateToNodeMap[StateInObjectKey]
  71. stateToNodeMap[StateInObjSpace].TransitionEdges['\n'] = stateToNodeMap[StateInNewline]
  72. // TODO: see if this is needed for formatting
  73. stateToNodeMap[StateInObjSpace].TransitionEdges[' '] = stateToNodeMap[StateInObjSpace]
  74. stateToNodeMap[StateInTab].TransitionEdges['"'] = stateToNodeMap[StateInObjectKey]
  75. stateToNodeMap[StateInObjectKey].TransitionEdges[rune(-1)] = stateToNodeMap[StateInObjectKey]
  76. stateToNodeMap[StateInObjectKey].TransitionEdges['"'] = stateToNodeMap[StateInObjectKeyEnd]
  77. stateToNodeMap[StateInObjectKeyEnd].TransitionEdges[':'] = stateToNodeMap[StateInColon]
  78. stateToNodeMap[StateInObjectEnd].TransitionEdges[','] = stateToNodeMap[StateInComma]
  79. stateToNodeMap[StateInObjectEnd].TransitionEdges['}'] = stateToNodeMap[StateInObjectEnd]
  80. // where values should be
  81. // this could be combined but the probl might change, we're alr doing a skip ahead
  82. stateToNodeMap[StateInColon].TransitionEdges[' '] = stateToNodeMap[StateInSpaceToValue]
  83. stateToNodeMap[StateInColon].TransitionEdges['['] = stateToNodeMap[StateInList]
  84. stateToNodeMap[StateInColon].TransitionEdges['{'] = stateToNodeMap[StateInObject]
  85. b.addValueConnections(stateToNodeMap[StateInColon])
  86. // Leads to a value
  87. stateToNodeMap[StateInSpaceToValue].TransitionEdges['['] = stateToNodeMap[StateInList]
  88. stateToNodeMap[StateInSpaceToValue].TransitionEdges['{'] = stateToNodeMap[StateInObject]
  89. b.addValueConnections(stateToNodeMap[StateInSpaceToValue])
  90. stateToNodeMap[StateInSpaceToValue].TransitionEdges['}'] = stateToNodeMap[StateInObjectEnd]
  91. // Values
  92. // string node
  93. stateToNodeMap[StateInString].TransitionEdges[rune(-1)] = stateToNodeMap[StateInString]
  94. stateToNodeMap[StateInString].TransitionEdges['"'] = stateToNodeMap[StateInStringEnd]
  95. // String end node
  96. b.addEnds(stateToNodeMap[StateInStringEnd])
  97. stateToNodeMap[StateInStringEnd].TransitionEdges[' '] = stateToNodeMap[StateInSpaceEndValue]
  98. stateToNodeMap[StateInStringEnd].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  99. // TODO: add counters for allowable number of decimals, e, E, etc
  100. // number node
  101. for _, r := range validNumberRunes {
  102. stateToNodeMap[StateInNumber].TransitionEdges[r] = stateToNodeMap[StateInNumber]
  103. }
  104. b.addEnds(stateToNodeMap[StateInNumber])
  105. stateToNodeMap[StateInNumber].TransitionEdges[' '] = stateToNodeMap[StateInSpaceEndValue]
  106. stateToNodeMap[StateInNumber].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  107. // list node
  108. stateToNodeMap[StateInList].TransitionEdges[','] = stateToNodeMap[StateInComma]
  109. stateToNodeMap[StateInList].TransitionEdges['{'] = stateToNodeMap[StateInObject]
  110. stateToNodeMap[StateInList].TransitionEdges[' '] = stateToNodeMap[StateInList]
  111. stateToNodeMap[StateInList].TransitionEdges['\n'] = stateToNodeMap[StateInList]
  112. // list end node
  113. stateToNodeMap[StateInListEnd].TransitionEdges['}'] = stateToNodeMap[StateInObjectEnd]
  114. stateToNodeMap[StateInListEnd].TransitionEdges[' '] = stateToNodeMap[StateInSpaceEndValue]
  115. stateToNodeMap[StateInListEnd].TransitionEdges[','] = stateToNodeMap[StateInComma]
  116. stateToNodeMap[StateInListEnd].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  117. // empty list
  118. stateToNodeMap[StateInList].TransitionEdges[']'] = stateToNodeMap[StateInListEnd]
  119. b.addValueConnections(stateToNodeMap[StateInList])
  120. // null node
  121. for _, r := range validNullRunes {
  122. stateToNodeMap[StateInNull].TransitionEdges[r] = stateToNodeMap[StateInNull]
  123. }
  124. b.addEnds(stateToNodeMap[StateInNull])
  125. stateToNodeMap[StateInNull].TransitionEdges[' '] = stateToNodeMap[StateInSpaceToValue]
  126. stateToNodeMap[StateInNull].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  127. // list comma
  128. // should point to values
  129. stateToNodeMap[StateInListComma].TransitionEdges[' '] = stateToNodeMap[StateInListComma]
  130. stateToNodeMap[StateInListComma].TransitionEdges['{'] = stateToNodeMap[StateInObject]
  131. stateToNodeMap[StateInListComma].TransitionEdges['\n'] = stateToNodeMap[StateInList]
  132. b.addValueConnections(stateToNodeMap[StateInListComma])
  133. // list object end
  134. stateToNodeMap[StateInListObjectEnd].TransitionEdges[','] = stateToNodeMap[StateInListComma]
  135. stateToNodeMap[StateInListObjectEnd].TransitionEdges[']'] = stateToNodeMap[StateInListEnd]
  136. // TODO: not sure if this is needed
  137. stateToNodeMap[StateInListObjectEnd].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  138. // bool node
  139. for _, r := range validBoolRunes {
  140. stateToNodeMap[StateInBool].TransitionEdges[r] = stateToNodeMap[StateInBool]
  141. }
  142. stateToNodeMap[StateInBool].TransitionEdges['\n'] = stateToNodeMap[StateInNewline]
  143. b.addEnds(stateToNodeMap[StateInBool])
  144. stateToNodeMap[StateInBool].TransitionEdges[' '] = stateToNodeMap[StateInSpaceEndValue]
  145. stateToNodeMap[StateInBool].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  146. // comma node
  147. stateToNodeMap[StateInComma].TransitionEdges['{'] = stateToNodeMap[StateInObject]
  148. stateToNodeMap[StateInComma].TransitionEdges['\n'] = stateToNodeMap[StateInNewline]
  149. stateToNodeMap[StateInComma].TransitionEdges['"'] = stateToNodeMap[StateInObjectKey]
  150. stateToNodeMap[StateInComma].TransitionEdges[' '] = stateToNodeMap[StateInObjSpace]
  151. // space end value
  152. stateToNodeMap[StateInSpaceEndValue].TransitionEdges[' '] = stateToNodeMap[StateInSpaceEndValue]
  153. stateToNodeMap[StateInSpaceEndValue].TransitionEdges['}'] = stateToNodeMap[StateInObjectEnd]
  154. stateToNodeMap[StateInSpaceEndValue].TransitionEdges[']'] = stateToNodeMap[StateInListEnd]
  155. stateToNodeMap[StateInSpaceEndValue].TransitionEdges['\n'] = stateToNodeMap[StateInNewlineEndValue]
  156. b.stateToNodeMap = stateToNodeMap
  157. if err := b.preComputeValidStates(); err != nil {
  158. return err
  159. }
  160. return nil
  161. }
  162. func (b *PDAGraphBuilder) addEnds(node *PDA) {
  163. node.TransitionEdges[','] = b.stateToNodeMap[StateInComma]
  164. node.TransitionEdges['}'] = b.stateToNodeMap[StateInObjectEnd]
  165. node.TransitionEdges[']'] = b.stateToNodeMap[StateInListEnd]
  166. }
  167. func (b *PDAGraphBuilder) addValueConnections(node *PDA) {
  168. node.TransitionEdges['"'] = b.stateToNodeMap[StateInString]
  169. for _, r := range validNumberRunes {
  170. node.TransitionEdges[r] = b.stateToNodeMap[StateInNumber]
  171. }
  172. // TODO(parthsareen): force the output and shift similar to structured outputs
  173. node.TransitionEdges['t'] = b.stateToNodeMap[StateInBool]
  174. node.TransitionEdges['f'] = b.stateToNodeMap[StateInBool]
  175. node.TransitionEdges['n'] = b.stateToNodeMap[StateInNull]
  176. }
  177. func (b *PDAGraphBuilder) preComputeValidStates() error {
  178. for _, node := range b.stateToNodeMap {
  179. if err := b.CreateMask(node); err != nil {
  180. return err
  181. }
  182. }
  183. return nil
  184. }
  185. func (b *PDAGraphBuilder) CreateMask(node *PDA) error {
  186. for i := range b.decodedToks {
  187. token := b.decodedToks[i]
  188. // Skip EOS/BOS tokens and empty tokens since they are not valid in JSON
  189. if b.proc.Is(uint32(i), model.SpecialEOS) || b.proc.Is(uint32(i), model.SpecialBOS) || token == "" || token == "\"\"" {
  190. continue
  191. }
  192. curNode := node
  193. valid := true
  194. consumedSpecialRunes := make(map[rune]bool)
  195. for _, r := range token {
  196. curNode, valid = isRuneValid(r, curNode, consumedSpecialRunes)
  197. if curNode == nil || !valid {
  198. break
  199. }
  200. }
  201. if valid {
  202. node.MaskTokenIDToNode[int32(i)] = curNode
  203. }
  204. }
  205. return nil
  206. }
  207. func isRuneValid(r rune, curNode *PDA, consumedSpecialRunes map[rune]bool) (*PDA, bool) {
  208. if consumedSpecialRunes[r] {
  209. return nil, false
  210. }
  211. specialRune := slices.Contains(stringInvalidRunes, r)
  212. if specialRune {
  213. if curNode.State == StateInString || curNode.State == StateInObjectKey {
  214. return nil, false
  215. }
  216. }
  217. // Check for specific rune transition
  218. if nextNode, ok := curNode.TransitionEdges[r]; ok {
  219. if specialRune {
  220. if curNode.State == nextNode.State {
  221. return nil, false
  222. }
  223. consumedSpecialRunes[r] = true
  224. }
  225. return nextNode, true
  226. }
  227. // Check for sentinel value - if present, any rune is valid
  228. if nextNode, ok := curNode.TransitionEdges[rune(-1)]; ok {
  229. return nextNode, true
  230. }
  231. return nil, false
  232. }