ggml.go 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179
  1. package llm
  2. import (
  3. "encoding/binary"
  4. "errors"
  5. "fmt"
  6. "io"
  7. )
  8. type ModelFamily string
  9. const ModelFamilyLlama ModelFamily = "llama"
  10. type ModelType uint32
  11. const (
  12. ModelType3B ModelType = 26
  13. ModelType7B ModelType = 32
  14. ModelType13B ModelType = 40
  15. ModelType30B ModelType = 60
  16. ModelType65B ModelType = 80
  17. )
  18. type FileType uint32
  19. const (
  20. FileTypeF32 FileType = iota
  21. FileTypeF16
  22. FileTypeQ4_0
  23. FileTypeQ4_1
  24. FileTypeQ4_1_F16
  25. FileTypeQ8_0 = iota + 2
  26. FileTypeQ5_0
  27. FileTypeQ5_1
  28. FileTypeQ2_K
  29. FileTypeQ3_K
  30. FileTypeQ4_K
  31. FileTypeQ5_K
  32. FileTypeQ6_K
  33. )
  34. type GGML struct {
  35. ModelFamily
  36. ModelType
  37. magic uint32
  38. container
  39. llamaHyperparameters
  40. }
  41. type container interface {
  42. Name() string
  43. Decode(io.Reader) error
  44. }
  45. type containerGGML struct {
  46. }
  47. func (c *containerGGML) Name() string {
  48. return "ggml"
  49. }
  50. func (c *containerGGML) Decode(r io.Reader) error {
  51. return nil
  52. }
  53. type containerGGMF struct {
  54. version uint32
  55. }
  56. func (c *containerGGMF) Name() string {
  57. return "ggmf"
  58. }
  59. func (c *containerGGMF) Decode(r io.Reader) error {
  60. var version uint32
  61. binary.Read(r, binary.LittleEndian, &version)
  62. switch version {
  63. case 1:
  64. default:
  65. return errors.New("invalid version")
  66. }
  67. c.version = version
  68. return nil
  69. }
  70. type containerGGJT struct {
  71. version uint32
  72. }
  73. func (c *containerGGJT) Name() string {
  74. return "ggjt"
  75. }
  76. func (c *containerGGJT) Decode(r io.Reader) error {
  77. var version uint32
  78. binary.Read(r, binary.LittleEndian, &version)
  79. switch version {
  80. case 1, 2, 3:
  81. default:
  82. return errors.New("invalid version")
  83. }
  84. c.version = version
  85. return nil
  86. }
  87. type containerLORA struct {
  88. version uint32
  89. }
  90. func (c *containerLORA) Name() string {
  91. return "ggla"
  92. }
  93. func (c *containerLORA) Decode(r io.Reader) error {
  94. var version uint32
  95. binary.Read(r, binary.LittleEndian, &version)
  96. switch version {
  97. case 1:
  98. default:
  99. return errors.New("invalid version")
  100. }
  101. c.version = version
  102. return nil
  103. }
  104. const (
  105. // / Magic constant for `ggml` files (unversioned).
  106. FILE_MAGIC_GGML = 0x67676d6c
  107. // / Magic constant for `ggml` files (versioned, ggmf).
  108. FILE_MAGIC_GGMF = 0x67676d66
  109. // / Magic constant for `ggml` files (versioned, ggjt).
  110. FILE_MAGIC_GGJT = 0x67676a74
  111. // / Magic constant for `ggla` files (LoRA adapter).
  112. FILE_MAGIC_GGLA = 0x67676C61
  113. )
  114. func DecodeGGML(r io.ReadSeeker, hint ModelFamily) (*GGML, error) {
  115. var ggml GGML
  116. binary.Read(r, binary.LittleEndian, &ggml.magic)
  117. switch ggml.magic {
  118. case FILE_MAGIC_GGML:
  119. ggml.container = &containerGGML{}
  120. case FILE_MAGIC_GGMF:
  121. ggml.container = &containerGGMF{}
  122. case FILE_MAGIC_GGJT:
  123. ggml.container = &containerGGJT{}
  124. case FILE_MAGIC_GGLA:
  125. ggml.container = &containerLORA{}
  126. default:
  127. return nil, errors.New("invalid file magic")
  128. }
  129. if err := ggml.Decode(r); err != nil {
  130. return nil, err
  131. }
  132. // different model types may have different layouts for hyperparameters
  133. switch hint {
  134. case ModelFamilyLlama:
  135. binary.Read(r, binary.LittleEndian, &ggml.llamaHyperparameters)
  136. // TODO: sanity check hyperparameters
  137. default:
  138. return nil, fmt.Errorf("unsupported model type: %s", hint)
  139. }
  140. // final model type
  141. ggml.ModelFamily = hint
  142. ggml.ModelType = ModelType(ggml.NumLayer)
  143. return &ggml, nil
  144. }