ggml.go 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180
  1. package llm
  2. import (
  3. "encoding/binary"
  4. "errors"
  5. "fmt"
  6. "io"
  7. )
  8. type ModelFamily string
  9. const ModelFamilyLlama ModelFamily = "llama"
  10. type ModelType uint32
  11. const (
  12. ModelType3B ModelType = 26
  13. ModelType7B ModelType = 32
  14. ModelType13B ModelType = 40
  15. ModelType30B ModelType = 60
  16. ModelType65B ModelType = 80
  17. )
  18. type FileType uint32
  19. const (
  20. FileTypeF32 FileType = iota
  21. FileTypeF16
  22. FileTypeQ4_0
  23. FileTypeQ4_1
  24. FileTypeQ4_1_F16
  25. FileTypeQ8_0 = iota + 3
  26. FileTypeQ5_0
  27. FileTypeQ5_1
  28. FileTypeQ2_K
  29. FileTypeQ3_K
  30. FileTypeQ4_K
  31. FileTypeQ5_K
  32. FileTypeQ6_K
  33. FileTypeUnknown = -1
  34. )
  35. type GGML struct {
  36. ModelFamily
  37. ModelType
  38. magic uint32
  39. container
  40. llamaHyperparameters
  41. }
  42. type container interface {
  43. Name() string
  44. Decode(io.Reader) error
  45. }
  46. type containerGGML struct {
  47. }
  48. func (c *containerGGML) Name() string {
  49. return "ggml"
  50. }
  51. func (c *containerGGML) Decode(r io.Reader) error {
  52. return nil
  53. }
  54. type containerGGMF struct {
  55. version uint32
  56. }
  57. func (c *containerGGMF) Name() string {
  58. return "ggmf"
  59. }
  60. func (c *containerGGMF) Decode(r io.Reader) error {
  61. var version uint32
  62. binary.Read(r, binary.LittleEndian, &version)
  63. switch version {
  64. case 1:
  65. default:
  66. return errors.New("invalid version")
  67. }
  68. c.version = version
  69. return nil
  70. }
  71. type containerGGJT struct {
  72. version uint32
  73. }
  74. func (c *containerGGJT) Name() string {
  75. return "ggjt"
  76. }
  77. func (c *containerGGJT) Decode(r io.Reader) error {
  78. var version uint32
  79. binary.Read(r, binary.LittleEndian, &version)
  80. switch version {
  81. case 1, 2, 3:
  82. default:
  83. return errors.New("invalid version")
  84. }
  85. c.version = version
  86. return nil
  87. }
  88. type containerLORA struct {
  89. version uint32
  90. }
  91. func (c *containerLORA) Name() string {
  92. return "ggla"
  93. }
  94. func (c *containerLORA) Decode(r io.Reader) error {
  95. var version uint32
  96. binary.Read(r, binary.LittleEndian, &version)
  97. switch version {
  98. case 1:
  99. default:
  100. return errors.New("invalid version")
  101. }
  102. c.version = version
  103. return nil
  104. }
  105. const (
  106. // / Magic constant for `ggml` files (unversioned).
  107. FILE_MAGIC_GGML = 0x67676d6c
  108. // / Magic constant for `ggml` files (versioned, ggmf).
  109. FILE_MAGIC_GGMF = 0x67676d66
  110. // / Magic constant for `ggml` files (versioned, ggjt).
  111. FILE_MAGIC_GGJT = 0x67676a74
  112. // / Magic constant for `ggla` files (LoRA adapter).
  113. FILE_MAGIC_GGLA = 0x67676C61
  114. )
  115. func DecodeGGML(r io.ReadSeeker, hint ModelFamily) (*GGML, error) {
  116. var ggml GGML
  117. binary.Read(r, binary.LittleEndian, &ggml.magic)
  118. switch ggml.magic {
  119. case FILE_MAGIC_GGML:
  120. ggml.container = &containerGGML{}
  121. case FILE_MAGIC_GGMF:
  122. ggml.container = &containerGGMF{}
  123. case FILE_MAGIC_GGJT:
  124. ggml.container = &containerGGJT{}
  125. case FILE_MAGIC_GGLA:
  126. ggml.container = &containerLORA{}
  127. default:
  128. return nil, errors.New("invalid file magic")
  129. }
  130. if err := ggml.Decode(r); err != nil {
  131. return nil, err
  132. }
  133. // different model types may have different layouts for hyperparameters
  134. switch hint {
  135. case ModelFamilyLlama:
  136. binary.Read(r, binary.LittleEndian, &ggml.llamaHyperparameters)
  137. // TODO: sanity check hyperparameters
  138. default:
  139. return nil, fmt.Errorf("unsupported model type: %s", hint)
  140. }
  141. // final model type
  142. ggml.ModelFamily = hint
  143. ggml.ModelType = ModelType(ggml.NumLayer)
  144. return &ggml, nil
  145. }