parser.go 2.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118
  1. package parser
  2. import (
  3. "bufio"
  4. "bytes"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log"
  9. )
  10. type Command struct {
  11. Name string
  12. Args string
  13. }
  14. func (c *Command) Reset() {
  15. c.Name = ""
  16. c.Args = ""
  17. }
  18. func Parse(reader io.Reader) ([]Command, error) {
  19. var commands []Command
  20. var command, modelCommand Command
  21. scanner := bufio.NewScanner(reader)
  22. scanner.Buffer(make([]byte, 0, bufio.MaxScanTokenSize), bufio.MaxScanTokenSize)
  23. scanner.Split(scanModelfile)
  24. for scanner.Scan() {
  25. line := scanner.Bytes()
  26. fields := bytes.SplitN(line, []byte(" "), 2)
  27. if len(fields) == 0 || len(fields[0]) == 0 {
  28. continue
  29. }
  30. switch string(bytes.ToUpper(fields[0])) {
  31. case "FROM":
  32. command.Name = "model"
  33. command.Args = string(fields[1])
  34. // copy command for validation
  35. modelCommand = command
  36. case "LICENSE", "TEMPLATE", "SYSTEM", "PROMPT", "ADAPTER":
  37. command.Name = string(bytes.ToLower(fields[0]))
  38. command.Args = string(fields[1])
  39. case "PARAMETER":
  40. fields = bytes.SplitN(fields[1], []byte(" "), 2)
  41. if len(fields) < 2 {
  42. return nil, fmt.Errorf("missing value for %s", fields)
  43. }
  44. command.Name = string(fields[0])
  45. command.Args = string(fields[1])
  46. case "EMBED":
  47. return nil, fmt.Errorf("deprecated command: EMBED is no longer supported, use the /embed API endpoint instead")
  48. default:
  49. if !bytes.HasPrefix(fields[0], []byte("#")) {
  50. // log a warning for unknown commands
  51. log.Printf("WARNING: Unknown command: %s", fields[0])
  52. }
  53. continue
  54. }
  55. commands = append(commands, command)
  56. command.Reset()
  57. }
  58. if modelCommand.Args == "" {
  59. return nil, errors.New("no FROM line for the model was specified")
  60. }
  61. return commands, scanner.Err()
  62. }
  63. func scanModelfile(data []byte, atEOF bool) (advance int, token []byte, err error) {
  64. advance, token, err = scan([]byte(`"""`), []byte(`"""`), data, atEOF)
  65. if err != nil {
  66. return 0, nil, err
  67. }
  68. if advance > 0 && token != nil {
  69. return advance, token, nil
  70. }
  71. advance, token, err = scan([]byte(`"`), []byte(`"`), data, atEOF)
  72. if err != nil {
  73. return 0, nil, err
  74. }
  75. if advance > 0 && token != nil {
  76. return advance, token, nil
  77. }
  78. return bufio.ScanLines(data, atEOF)
  79. }
  80. func scan(openBytes, closeBytes, data []byte, atEOF bool) (advance int, token []byte, err error) {
  81. newline := bytes.IndexByte(data, '\n')
  82. if start := bytes.Index(data, openBytes); start >= 0 && start < newline {
  83. end := bytes.Index(data[start+len(openBytes):], closeBytes)
  84. if end < 0 {
  85. if atEOF {
  86. return 0, nil, fmt.Errorf("unterminated %s: expecting %s", openBytes, closeBytes)
  87. } else {
  88. return 0, nil, nil
  89. }
  90. }
  91. n := start + len(openBytes) + end + len(closeBytes)
  92. newData := data[:start]
  93. newData = append(newData, data[start+len(openBytes):n-len(closeBytes)]...)
  94. return n, newData, nil
  95. }
  96. return 0, nil, nil
  97. }