ranker_test.go 3.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123
  1. package core
  2. import (
  3. "github.com/huichen/wukong/types"
  4. "github.com/huichen/wukong/utils"
  5. "reflect"
  6. "testing"
  7. )
  // DummyScoringFields is the per-document payload the tests in this file
  // register through Ranker.AddScoringFields and later receive back in
  // DummyScoringCriteria.Score.
  type DummyScoringFields struct {
  	// label is set by the tests but never read by DummyScoringCriteria.Score.
  	label string
  	// counter is converted to float32 and added to amount to form the score.
  	counter int
  	// amount is the float32 part of the score.
  	amount float32
  }
  // DummyScoringCriteria is the scoring rule used by the tests in this file.
  type DummyScoringCriteria struct {
  	// Threshold is the minimum value a document must reach in Score; a
  	// document whose value is below it gets an empty score slice. The zero
  	// value therefore only rejects negative values.
  	Threshold float32
  }
  16. func (criteria DummyScoringCriteria) Score(
  17. doc types.IndexedDocument, fields interface{}) []float32 {
  18. if reflect.TypeOf(fields) == reflect.TypeOf(DummyScoringFields{}) {
  19. dsf := fields.(DummyScoringFields)
  20. value := float32(dsf.counter) + dsf.amount
  21. if value < criteria.Threshold {
  22. return []float32{}
  23. }
  24. return []float32{value}
  25. }
  26. return []float32{}
  27. }
  28. func TestRankDocument(t *testing.T) {
  29. var ranker Ranker
  30. ranker.Init()
  31. scoredDocs := ranker.Rank([]types.IndexedDocument{
  32. types.IndexedDocument{DocId: 1, BM25: 6},
  33. types.IndexedDocument{DocId: 3, BM25: 24},
  34. types.IndexedDocument{DocId: 4, BM25: 18},
  35. }, types.RankOptions{ScoringCriteria: types.RankByBM25{}})
  36. utils.Expect(t, "[3 [24000 ]] [4 [18000 ]] [1 [6000 ]] ", scoredDocsToString(scoredDocs))
  37. scoredDocs = ranker.Rank([]types.IndexedDocument{
  38. types.IndexedDocument{DocId: 1, BM25: 6},
  39. types.IndexedDocument{DocId: 3, BM25: 24},
  40. types.IndexedDocument{DocId: 2, BM25: 0},
  41. types.IndexedDocument{DocId: 4, BM25: 18},
  42. }, types.RankOptions{ScoringCriteria: types.RankByBM25{}, ReverseOrder: true})
  43. utils.Expect(t, "[2 [0 ]] [1 [6000 ]] [4 [18000 ]] [3 [24000 ]] ", scoredDocsToString(scoredDocs))
  44. }
  45. func TestRankWithCriteria(t *testing.T) {
  46. var ranker Ranker
  47. ranker.Init()
  48. ranker.AddScoringFields(1, DummyScoringFields{
  49. label: "label3",
  50. counter: 3,
  51. amount: 22.3,
  52. })
  53. ranker.AddScoringFields(2, DummyScoringFields{
  54. label: "label4",
  55. counter: 1,
  56. amount: 2,
  57. })
  58. ranker.AddScoringFields(3, DummyScoringFields{
  59. label: "label1",
  60. counter: 7,
  61. amount: 10.3,
  62. })
  63. ranker.AddScoringFields(4, DummyScoringFields{
  64. label: "label1",
  65. counter: -1,
  66. amount: 2.3,
  67. })
  68. criteria := DummyScoringCriteria{}
  69. scoredDocs := ranker.Rank([]types.IndexedDocument{
  70. types.IndexedDocument{DocId: 1, TokenProximity: 6},
  71. types.IndexedDocument{DocId: 2, TokenProximity: -1},
  72. types.IndexedDocument{DocId: 3, TokenProximity: 24},
  73. types.IndexedDocument{DocId: 4, TokenProximity: 18},
  74. }, types.RankOptions{ScoringCriteria: criteria})
  75. utils.Expect(t, "[1 [25300 ]] [3 [17300 ]] [2 [3000 ]] [4 [1300 ]] ", scoredDocsToString(scoredDocs))
  76. criteria.Threshold = 4
  77. scoredDocs = ranker.Rank([]types.IndexedDocument{
  78. types.IndexedDocument{DocId: 1, TokenProximity: 6},
  79. types.IndexedDocument{DocId: 2, TokenProximity: -1},
  80. types.IndexedDocument{DocId: 3, TokenProximity: 24},
  81. types.IndexedDocument{DocId: 4, TokenProximity: 18},
  82. }, types.RankOptions{ScoringCriteria: criteria})
  83. utils.Expect(t, "[1 [25300 ]] [3 [17300 ]] ", scoredDocsToString(scoredDocs))
  84. }
  85. func TestRemoveDocument(t *testing.T) {
  86. var ranker Ranker
  87. ranker.Init()
  88. ranker.AddScoringFields(1, DummyScoringFields{
  89. label: "label3",
  90. counter: 3,
  91. amount: 22.3,
  92. })
  93. ranker.AddScoringFields(2, DummyScoringFields{
  94. label: "label4",
  95. counter: 1,
  96. amount: 2,
  97. })
  98. ranker.AddScoringFields(3, DummyScoringFields{
  99. label: "label1",
  100. counter: 7,
  101. amount: 10.3,
  102. })
  103. ranker.RemoveScoringFields(3)
  104. criteria := DummyScoringCriteria{}
  105. scoredDocs := ranker.Rank([]types.IndexedDocument{
  106. types.IndexedDocument{DocId: 1, TokenProximity: 6},
  107. types.IndexedDocument{DocId: 2, TokenProximity: -1},
  108. types.IndexedDocument{DocId: 3, TokenProximity: 24},
  109. types.IndexedDocument{DocId: 4, TokenProximity: 18},
  110. }, types.RankOptions{ScoringCriteria: criteria})
  111. utils.Expect(t, "[1 [25300 ]] [2 [3000 ]] ", scoredDocsToString(scoredDocs))
  112. }