Skip to content

Commit c038ca1

Browse files
committed
Cleanup for exactish
1 parent d0140c8 commit c038ca1

File tree

3 files changed

+11
-17
lines changed

3 files changed

+11
-17
lines changed

exampledocs/exactish.json

+4
Original file line number | Diff line number | Diff line change
@@ -10,5 +10,9 @@
1010
{
1111
"id": "3",
1212
"title": "Meet the Monkees"
13+
},
14+
{
15+
"id": "4",
16+
"title": "Corporate boy bands through the ages"
1317
}
1418
]

ruby/exactish_query.rb

+3-3
Original file line number | Diff line number | Diff line change
@@ -4,21 +4,21 @@
44
'defType' => 'dismax',
55
'q' => 'the monkees',
66
'qf' => 'title',
7-
'pf' => 'title'
7+
'pf' => 'title^2'
88
},
99
{
1010
'fl' => 'score, *',
1111
'defType' => 'dismax',
1212
'q' => 'the monkees',
1313
'qf' => 'title',
14-
'pf' => 'title_exact^10 title'
14+
'pf' => 'title_exact^10 title^2'
1515
},
1616
{
1717
'fl' => 'score, *',
1818
'defType' => 'dismax',
1919
'q' => 'the monkees',
2020
'qf' => 'title',
21-
'pf' => 'title_exact^10 title_l^3 title'
21+
'pf' => 'title_exact^10 title_l^3 title^2'
2222
}
2323

2424
]

solr/conf/schema.xml

+4-14
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,6 @@
103103
- Synonyms can be put in syn.txt (see sample synonyms.txt file in solr example)
104104
- Word delimiter splits on CaseChange and numbers (e.g., code4lib).
105105
- The CJK stuff produces bigrams for those languages
106-
- Remove Duplicates does what it says on the tin.
107106
-->
108107
<fieldtype name="text" class="solr.TextField" positionIncrementGap="1000">
109108
<analyzer>
@@ -113,8 +112,6 @@
113112
<!-- <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="1" catenateNumbers="1" catenateAll="0"/> -->
114113
<filter class="solr.CJKWidthFilterFactory"/>
115114
<filter class="solr.CJKBigramFilterFactory"/>
116-
<filter class="solr.TrimFilterFactory"/>
117-
<filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
118115
</analyzer>
119116
</fieldtype>
120117

@@ -124,32 +121,25 @@
124121

125122
<fieldtype name="text_lr" class="solr.TextField" positionIncrementGap="1000">
126123
<analyzer>
124+
<charFilter class="solr.PatternReplaceCharFilterFactory"
125+
pattern="^(.*)$" replacement="AAAA $1 ZZZZ" />
127126
<tokenizer class="solr.ICUTokenizerFactory"/>
128-
<charFilter class="solr.PatternReplaceCharFilterFactory"
129-
pattern="^(.*)$" replacement="AAAA $1 ZZZZ" />
130127
<filter class="solr.ICUFoldingFilterFactory"/>
131128
<filter class="solr.SynonymFilterFactory" synonyms="syn.txt" ignoreCase="true" expand="false"/>
132129
<filter class="solr.CJKWidthFilterFactory"/>
133130
<filter class="solr.CJKBigramFilterFactory"/>
134-
<filter class="solr.TrimFilterFactory"/>
135-
<filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
136131
</analyzer>
137132
</fieldtype>
138133

139134
<fieldtype name="text_l" class="solr.TextField" positionIncrementGap="1000">
140135
<analyzer>
136+
<charFilter class="solr.PatternReplaceCharFilterFactory"
137+
pattern="^(.*)$" replacement="AAAA $1" />
141138
<tokenizer class="solr.ICUTokenizerFactory"/>
142139
<filter class="solr.ICUFoldingFilterFactory"/>
143140
<filter class="solr.SynonymFilterFactory" synonyms="syn.txt" ignoreCase="true" expand="false"/>
144141
<filter class="solr.CJKWidthFilterFactory"/>
145142
<filter class="solr.CJKBigramFilterFactory"/>
146-
<filter class="solr.TrimFilterFactory"/>
147-
<filter class="solr.PatternReplaceFilterFactory"
148-
pattern="\p{Z}+" replacement=" "
149-
/>
150-
<charFilter class="solr.PatternReplaceCharFilterFactory"
151-
pattern="^(.*)$" replacement="AAAA $1" />
152-
<filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
153143
</analyzer>
154144
</fieldtype>
155145

0 commit comments

Comments
 (0)