# searchkick_test.rb (6.02 KB)
require "test_helper"
# Integration tests for product search against a Tire-managed "products"
# index. Each test stores a few documents and then checks the names (and
# their order) returned by the query built in #assert_search.
class TestSearchkick < Minitest::Unit::TestCase
  # Drops the "products" index and creates it again with the custom
  # analysis settings and the "document" mapping defined further down.
  # The index handle is kept in the global $index, which #store relies on.
  def setup
    $index = Tire::Index.new("products")
    $index.delete

    creation_options = {
      settings: index_settings,
      mappings: index_mappings
    }
    $index.create(creation_options)
  end

  # --- exact matches -------------------------------------------------------

  def test_match
    store_names(["Whole Milk", "Fat Free Milk", "Milk"])
    assert_search("milk", ["Milk", "Whole Milk", "Fat Free Milk"])
  end

  # An upper-case query is expected to return the same ranking as test_match.
  def test_case
    store_names(["Whole Milk", "Fat Free Milk", "Milk"])
    assert_search("MILK", ["Milk", "Whole Milk", "Fat Free Milk"])
  end

  # --- ascii folding -------------------------------------------------------

  # A plain-ASCII query is expected to find the accented name.
  def test_jalapenos
    store_names(["Jalapeño"])
    assert_search("jalapeno", ["Jalapeño"])
  end

  # --- stemming ------------------------------------------------------------

  # A plural query is expected to match the singular names.
  def test_stemming
    store_names(["Whole Milk", "Fat Free Milk", "Milk"])
    assert_search("milks", ["Milk", "Whole Milk", "Fat Free Milk"])
  end

  # --- fuzzy matching ------------------------------------------------------

  # The near-miss "Beef" is expected too, ranked after the exact hit.
  def test_fuzzy
    store_names(["Sliced Beets", "Beef"])
    assert_search("beets", ["Sliced Beets", "Beef"])
  end

  # --- conversions ---------------------------------------------------------

  # Documents carry per-query conversion counts; the expected order follows
  # the count recorded for the searched query.
  def test_conversions
    tomato_sauce = {
      name: "Tomato Sauce",
      conversions: [{query: "tomato sauce", count: 100}, {query: "tomato", count: 2}]
    }
    tomato_paste = {
      name: "Tomato Paste",
      conversions: []
    }
    tomatoes = {
      name: "Tomatoes",
      conversions: [{query: "tomato", count: 100}, {query: "tomato sauce", count: 2}]
    }
    store([tomato_sauce, tomato_paste, tomatoes])

    # not asserted here: "Tomato Paste"
    assert_search("tomato sauce", ["Tomato Sauce", "Tomatoes"])
    assert_search("tomato", ["Tomatoes", "Tomato Sauce", "Tomato Paste"])
    # not asserted here: "Tomatoes", "Tomato Sauce"
    assert_search("tomato paste", ["Tomato Paste"])
  end

  # Conversion queries recorded in different inflections and letter cases
  # of the same word.
  def test_conversions_stemmed
    tomato_a = {
      name: "Tomato A",
      conversions: [
        {query: "tomato", count: 1},
        {query: "tomatos", count: 1},
        {query: "Tomatoes", count: 3}
      ]
    }
    tomato_b = {
      name: "Tomato B",
      conversions: [{query: "tomato", count: 4}]
    }
    store([tomato_a, tomato_b])

    assert_search("tomato", ["Tomato A", "Tomato B"])
  end

  # --- spaces --------------------------------------------------------------

  # Two-word name, one-word query.
  def test_spaces_in_field
    store_names(["Red Bull"])
    assert_search("redbull", ["Red Bull"])
  end

  # One-word name, query split in two.
  def test_spaces_in_query
    store_names(["Dishwasher Soap"])
    assert_search("dish washer", ["Dishwasher Soap"])
  end

  # Only the name containing all three words is expected.
  def test_spaces_three_words
    store_names(["Dish Washer Soap", "Dish Washer"])
    assert_search("dish washer soap", ["Dish Washer Soap"])
  end

  # Joined and pluralised query against a two-word name.
  def test_spaces_stemming
    store_names(["Almond Milk"])
    assert_search("almondmilks", ["Almond Milk"])
  end

  # --- keywords (synonyms) -------------------------------------------------

  # Brand queries are expected to also return the generic products listed
  # in the synonym filter.
  def test_keywords
    store_names(["Clorox Bleach", "Kroger Bleach", "Saran Wrap", "Kroger Plastic Wrap"])
    assert_search("clorox", ["Clorox Bleach", "Kroger Bleach"])
    assert_search("saran wrap", ["Saran Wrap", "Kroger Plastic Wrap"])
  end

  def test_keywords_qtips
    store_names(["Q Tips", "Kroger Cotton Swabs"])
    assert_search("q tips", ["Q Tips", "Kroger Cotton Swabs"])
  end

  # "Yellow Onions" must not be returned for the synonym of "green onion".
  def test_keywords_exact
    store_names(["Green Onions", "Yellow Onions"])
    assert_search("scallion", ["Green Onions"])
  end

  # Same as test_keywords_exact, with a plural query.
  def test_keywords_stemmed
    store_names(["Green Onions", "Yellow Onions"])
    assert_search("scallions", ["Green Onions"])
  end

  # --- global boost --------------------------------------------------------

  # The document carrying a _boost is expected first.
  def test_boost
    boosted = {name: "Organic Tomato A", _boost: 10}
    plain = {name: "Tomato B"}
    store([boosted, plain])

    assert_search("tomato", ["Organic Tomato A", "Tomato B"])
  end

  # A document with a _boost of 0 is still expected in the results.
  def test_boost_zero
    store([{name: "Zero Boost", _boost: 0}])
    assert_search("zero", ["Zero Boost"])
  end

  # A document without _boost is expected to rank as if its boost were 1,
  # i.e. between the 1.1 and the 0.9 documents.
  def test_boost_null
    above = {name: "Zero Boost A", _boost: 1.1}
    unset = {name: "Zero Boost B"}
    below = {name: "Zero Boost C", _boost: 0.9}
    store([above, unset, below])

    assert_search("zero", ["Zero Boost A", "Zero Boost B", "Zero Boost C"])
  end

  protected

  # Index-level settings: one shard plus the custom analyzers and the token
  # filters they refer to. A new hash is built on every call.
  def index_settings
    {
      number_of_shards: 1,
      analysis: {
        analyzer: custom_analyzers,
        filter: custom_token_filters
      }
    }
  end

  # Analyzer definitions: "searchkick_keyword" (used by conversions.query)
  # and "searchkick" (used by the name field).
  def custom_analyzers
    {
      searchkick_keyword: {
        type: "custom",
        tokenizer: "keyword",
        filter: ["lowercase", "snowball"]
      },
      searchkick: {
        type: "custom",
        tokenizer: "standard",
        # Filter order matters: the shingle filter has to run before
        # snowball, and the synonym filter goes last, after stemming and
        # shingling.
        filter: [
          "standard",
          "lowercase",
          "asciifolding",
          "stop",
          "searchkick_shingle",
          "snowball",
          "searchkick_synonym"
        ]
      }
    }
  end

  # Token filters referenced by the "searchkick" analyzer.
  def custom_token_filters
    {
      searchkick_shingle: {
        type: "shingle",
        token_separator: ""
      },
      searchkick_synonym: {
        type: "synonym",
        ignore_case: true,
        synonyms: [
          "clorox => bleach",
          "saran wrap => plastic wrap",
          "scallion => green onion",
          "qtip => cotton swab"
        ]
      }
    }
  end

  # Mapping for the "document" type: an analyzed name plus nested
  # conversions made of a query string and an integer count.
  def index_mappings
    {
      document: {
        properties: {
          name: {
            type: "string",
            analyzer: "searchkick"
          },
          conversions: {
            type: "nested",
            properties: {
              query: {
                type: "string",
                analyzer: "searchkick_keyword"
              },
              count: {
                type: "integer"
              }
            }
          }
        }
      }
    }
  end

  # Stores every document in $index, then refreshes the index.
  def store(documents)
    documents.each { |doc| $index.store(doc) }
    $index.refresh
  end

  # Convenience wrapper: stores one document per name, each document
  # holding nothing but its name.
  def store_names(names)
    documents = names.map { |name| {name: name} }
    store(documents)
  end

  # Searches the "products" index for +term+ and asserts that the names of
  # the results equal +expected+, in the same order.
  #
  # The query is a boolean query with three "should" clauses:
  # 1. a match on the name field with a boost of 10,
  # 2. a second match on the name field with fuzziness options,
  # 3. a nested query on conversions, scored by the log of the count.
  def assert_search(term, expected)
    name_fields = ["name"]

    search = Tire.search("products", type: "document") do
      query do
        boolean do
          should { match(name_fields, term, boost: 10) }

          should do
            match(name_fields, term, use_dis_max: false, fuzziness: 0.6, max_expansions: 4, prefix_length: 2)
          end

          should do
            nested(path: "conversions", score_mode: "total") do
              query do
                custom_score(script: "log(doc['count'].value)") do
                  match("query", term)
                end
              end
            end
          end
        end
      end

      explain(true)
    end

    found_names = search.results.map(&:name)
    assert_equal(expected, found_names)
  end
end