transforms_test.go 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178
  1. package sample
  2. import (
  3. "math"
  4. "math/rand/v2"
  5. "testing"
  6. )
  7. // Helper to convert float64 slice to logit slice
  8. func toTokens(values []float64) []token {
  9. tokens := make([]token, len(values))
  10. for i, v := range values {
  11. tokens[i] = token{
  12. id: int32(i),
  13. value: float32(v),
  14. }
  15. }
  16. return tokens
  17. }
  18. // Helper to compare logit slices
  19. func compareLogits(t *testing.T, name string, want []float64, got []token) {
  20. t.Helper()
  21. if len(want) != len(got) {
  22. t.Errorf("%s: length mismatch: want %d, got %d", name, len(want), len(got))
  23. return
  24. }
  25. for i := range want {
  26. if math.Abs(float64(got[i].value)-want[i]) > 1e-6 {
  27. t.Errorf("%s: index %d: want %f, got %f", name, i, want[i], got[i].value)
  28. }
  29. }
  30. }
  31. func TestTemperatureAndSoftmax(t *testing.T) {
  32. input := []float64{1, 4, -2, 0}
  33. got := temperature(toTokens(input), 0.5)
  34. // Check probabilities sum to 1
  35. var sum float32
  36. for _, token := range got {
  37. sum += token.value
  38. }
  39. if math.Abs(float64(sum)-1.0) > 1e-6 {
  40. t.Errorf("probabilities don't sum to 1: got %f", sum)
  41. }
  42. got = temperature(toTokens(input), 1)
  43. // Check probabilities sum to 1
  44. sum = 0.0
  45. for _, token := range got {
  46. sum += token.value
  47. }
  48. if math.Abs(float64(sum)-1.0) > 1e-6 {
  49. t.Errorf("probabilities don't sum to 1: got %f", sum)
  50. }
  51. }
  52. func TestTopK(t *testing.T) {
  53. input := []float64{-3, -2, -1, 0, 1, 2, 4}
  54. // Test k=3
  55. got := topK(toTokens(input), 3)
  56. if len(got) != 3 {
  57. t.Errorf("topK(3): wrong length: want 3, got %d", len(got))
  58. }
  59. // Should keep highest 3 values: 4, 2, 1
  60. want := []float64{4, 2, 1}
  61. compareLogits(t, "topK(3)", want, got)
  62. // Test k > len
  63. got = topK(toTokens(input), 10)
  64. compareLogits(t, "topK(10)", input, got)
  65. }
  66. func TestTopP(t *testing.T) {
  67. input := []float64{-3, -2, -1, 0, 1, 2, 4}
  68. tokens := toTokens(input)
  69. // First apply temperature and softmax to get probabilities
  70. tokens = temperature(tokens, 1)
  71. sortLogits(tokens)
  72. // Then apply topP
  73. got := topP(tokens, 0.95)
  74. // Should keep tokens until cumsum > 0.95
  75. if len(got) > 3 {
  76. t.Errorf("topP(0.95): kept too many tokens: got %d", len(got))
  77. t.Logf("got: %v", got)
  78. }
  79. }
  80. func TestMinP(t *testing.T) {
  81. input := []float64{-3, -2, -1, 0, 1, 2, 4, 3}
  82. tokens := toTokens(input)
  83. // First apply temperature and softmax
  84. tokens = temperature(tokens, 1)
  85. // Then apply minP
  86. got := minP(tokens, 0.2)
  87. // Should keep tokens with prob >= 0.2 * max_prob
  88. if len(got) > 3 {
  89. t.Errorf("minP(0.2): kept too many tokens: got %d", len(got))
  90. }
  91. }
  92. func TestSortLogits(t *testing.T) {
  93. input := []float64{3, 1, 4, 2, -1, 0, -2}
  94. tokens := toTokens(input)
  95. sortLogits(tokens)
  96. for i := 1; i < len(tokens); i++ {
  97. if tokens[i].value > tokens[i-1].value {
  98. t.Errorf("sortLogits: tokens not sorted in descending order at index %d: %f > %f",
  99. i, tokens[i].value, tokens[i-1].value)
  100. }
  101. }
  102. want := []float64{4, 3, 2, 1, 0, -1, -2}
  103. compareLogits(t, "sortLogits", want, tokens)
  104. }
  105. func BenchmarkTransforms(b *testing.B) {
  106. // Generate random logits
  107. tokens := make([]token, 1<<16)
  108. for i := range tokens {
  109. tokens[i] = token{
  110. id: int32(i),
  111. value: rand.Float32(),
  112. }
  113. }
  114. tokensCopy := make([]token, len(tokens))
  115. b.Run("Temperature", func(b *testing.B) {
  116. b.ResetTimer()
  117. for b.Loop() {
  118. copy(tokensCopy, tokens)
  119. temperature(tokensCopy, 0.5)
  120. }
  121. })
  122. b.Run("TopK", func(b *testing.B) {
  123. b.ResetTimer()
  124. for b.Loop() {
  125. copy(tokensCopy, tokens)
  126. topK(tokensCopy, 10)
  127. }
  128. })
  129. b.Run("TopP", func(b *testing.B) {
  130. b.ResetTimer()
  131. for b.Loop() {
  132. copy(tokensCopy, tokens)
  133. topP(tokensCopy, 0.9)
  134. }
  135. })
  136. b.Run("MinP", func(b *testing.B) {
  137. b.ResetTimer()
  138. for b.Loop() {
  139. copy(tokensCopy, tokens)
  140. minP(tokensCopy, 0.2)
  141. }
  142. })
  143. b.Run("SortTokens", func(b *testing.B) {
  144. b.ResetTimer()
  145. for b.Loop() {
  146. copy(tokensCopy, tokens)
  147. sortLogits(tokensCopy)
  148. }
  149. })
  150. }