// parser.go

  1. package parser
  2. import (
  3. "bufio"
  4. "bytes"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "log/slog"
  9. )
  10. type Command struct {
  11. Name string
  12. Args string
  13. }
  14. func (c *Command) Reset() {
  15. c.Name = ""
  16. c.Args = ""
  17. }
  18. func Parse(reader io.Reader) ([]Command, error) {
  19. var commands []Command
  20. var command, modelCommand Command
  21. scanner := bufio.NewScanner(reader)
  22. scanner.Buffer(make([]byte, 0, bufio.MaxScanTokenSize), bufio.MaxScanTokenSize)
  23. scanner.Split(scanModelfile)
  24. for scanner.Scan() {
  25. line := scanner.Bytes()
  26. fields := bytes.SplitN(line, []byte(" "), 2)
  27. if len(fields) == 0 || len(fields[0]) == 0 {
  28. continue
  29. }
  30. switch string(bytes.ToUpper(fields[0])) {
  31. case "FROM":
  32. command.Name = "model"
  33. command.Args = string(bytes.TrimSpace(fields[1]))
  34. // copy command for validation
  35. modelCommand = command
  36. case "ADAPTER":
  37. command.Name = string(bytes.ToLower(fields[0]))
  38. command.Args = string(bytes.TrimSpace(fields[1]))
  39. case "LICENSE", "TEMPLATE", "SYSTEM", "PROMPT":
  40. command.Name = string(bytes.ToLower(fields[0]))
  41. command.Args = string(fields[1])
  42. case "PARAMETER":
  43. fields = bytes.SplitN(fields[1], []byte(" "), 2)
  44. if len(fields) < 2 {
  45. return nil, fmt.Errorf("missing value for %s", fields)
  46. }
  47. command.Name = string(fields[0])
  48. command.Args = string(bytes.TrimSpace(fields[1]))
  49. case "EMBED":
  50. return nil, fmt.Errorf("deprecated command: EMBED is no longer supported, use the /embed API endpoint instead")
  51. default:
  52. if !bytes.HasPrefix(fields[0], []byte("#")) {
  53. // log a warning for unknown commands
  54. slog.Warn(fmt.Sprintf("Unknown command: %s", fields[0]))
  55. }
  56. continue
  57. }
  58. commands = append(commands, command)
  59. command.Reset()
  60. }
  61. if modelCommand.Args == "" {
  62. return nil, errors.New("no FROM line for the model was specified")
  63. }
  64. return commands, scanner.Err()
  65. }
  66. func scanModelfile(data []byte, atEOF bool) (advance int, token []byte, err error) {
  67. advance, token, err = scan([]byte(`"""`), []byte(`"""`), data, atEOF)
  68. if err != nil {
  69. return 0, nil, err
  70. }
  71. if advance > 0 && token != nil {
  72. return advance, token, nil
  73. }
  74. advance, token, err = scan([]byte(`"`), []byte(`"`), data, atEOF)
  75. if err != nil {
  76. return 0, nil, err
  77. }
  78. if advance > 0 && token != nil {
  79. return advance, token, nil
  80. }
  81. return bufio.ScanLines(data, atEOF)
  82. }
  83. func scan(openBytes, closeBytes, data []byte, atEOF bool) (advance int, token []byte, err error) {
  84. newline := bytes.IndexByte(data, '\n')
  85. if start := bytes.Index(data, openBytes); start >= 0 && start < newline {
  86. end := bytes.Index(data[start+len(openBytes):], closeBytes)
  87. if end < 0 {
  88. if atEOF {
  89. return 0, nil, fmt.Errorf("unterminated %s: expecting %s", openBytes, closeBytes)
  90. } else {
  91. return 0, nil, nil
  92. }
  93. }
  94. n := start + len(openBytes) + end + len(closeBytes)
  95. newData := data[:start]
  96. newData = append(newData, data[start+len(openBytes):n-len(closeBytes)]...)
  97. return n, newData, nil
  98. }
  99. return 0, nil, nil
  100. }