Skip to content

Commit

Permalink
update solr config files for new argo title fields
Browse files Browse the repository at this point in the history
  • Loading branch information
ndushay committed Feb 21, 2024
1 parent 436b4e2 commit 3d20eda
Show file tree
Hide file tree
Showing 2 changed files with 76 additions and 9 deletions.
13 changes: 12 additions & 1 deletion solr_conf/conf/schema.xml
Original file line number Diff line number Diff line change
Expand Up @@ -106,7 +106,7 @@
<!-- Single-valued boolean fields: *_bs is stored but not indexed; *_bsi is stored and indexed -->
<dynamicField name="*_bs" type="boolean" stored="true" indexed="false" multiValued="false"/>
<dynamicField name="*_bsi" type="boolean" stored="true" indexed="true" multiValued="false"/>

<!-- English text (_ten...) -->
<!-- text English (_ten...) -->
<dynamicField name="*_teni" type="textEnglish" stored="false" indexed="true" multiValued="false"/>
<dynamicField name="*_tenim" type="textEnglish" stored="false" indexed="true" multiValued="true"/>
<dynamicField name="*_tens" type="textEnglish" stored="true" indexed="false" multiValued="false"/>
Expand Down Expand Up @@ -152,6 +152,17 @@
<!-- Text tokenized without stemming but left and right anchored, for "exactish" matches -->
<!-- Both variants are indexed only (not stored); _i is single-valued, _im is multi-valued -->
<dynamicField name="*_text_anchored_i" type="textAnchored" indexed="true" stored="false" multiValued="false"/>
<dynamicField name="*_text_anchored_im" type="textAnchored" indexed="true" stored="false" multiValued="true"/>

<!-- copyFields must have explicitly declared destination fields -->
<!-- NOTE(review): main_title_text_anchored_im also matches the *_text_anchored_im pattern above with
     identical attributes; confirm against the Solr copyField documentation whether the explicit
     declarations are strictly required or only a convention of this schema. -->
<!-- The four fields below are search-only copy targets (indexed, not stored, multi-valued).
     They are referenced by name in the qf / pf / pf2 / pf3 lists in solrconfig.xml, so any rename
     here must be mirrored there. -->
<!-- NOTE(review): full_title_unstemmed_im and additional_titles_unstemmed_im omit the "_text_"
     infix that main_title_text_unstemmed_im uses; confirm whether the difference is intentional. -->
<field name="main_title_text_anchored_im" type="textAnchored" indexed="true" stored="false" multiValued="true"/>
<field name="main_title_text_unstemmed_im" type="textUnstemmed" indexed="true" stored="false" multiValued="true"/>
<field name="full_title_unstemmed_im" type="textUnstemmed" indexed="true" stored="false" multiValued="true"/>
<field name="additional_titles_unstemmed_im" type="textUnstemmed" indexed="true" stored="false" multiValued="true"/>

<!-- Each *_tenim title field (textEnglish) is copied into its anchored and/or unstemmed counterpart;
     main_title_tenim feeds two destinations. maxChars caps each copy at 5000 characters. -->
<copyField source="main_title_tenim" dest="main_title_text_anchored_im" maxChars="5000" />
<copyField source="main_title_tenim" dest="main_title_text_unstemmed_im" maxChars="5000" />
<copyField source="full_title_tenim" dest="full_title_unstemmed_im" maxChars="5000" />
<copyField source="additional_titles_tenim" dest="additional_titles_unstemmed_im" maxChars="5000" />
</fields>

<types>
Expand Down
72 changes: 64 additions & 8 deletions solr_conf/conf/solrconfig.xml
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,14 @@
<str name="fl"> *, score</str>

<str name="qf">
sw_display_title_tesim^5
main_title_text_anchored_im^100
main_title_text_unstemmed_im^50
main_title_tenim^10
full_title_unstemmed_im^10
full_title_tenim^5
additional_titles_unstemmed_im^5
additional_titles_tenim^3

contributor_text_nostem_im^3
topic_tesim^2

Expand Down Expand Up @@ -75,7 +82,14 @@
contributor_orcids_ssim
</str>
<str name="pf"> <!-- (defType dismax, edismax: phrase boost within result set) -->
sw_display_title_tesim^25
main_title_text_anchored_im^500
main_title_text_unstemmed_im^250
main_title_tenim^50
full_title_unstemmed_im^50
full_title_tenim^25
additional_titles_unstemmed_im^25
additional_titles_tenim^15

contributor_text_nostem_im^15
topic_tesim^10

Expand All @@ -91,7 +105,14 @@
source_id_text_nostem_i^5
</str>
<str name="pf3"> <!-- (defType edismax: token trigrams boost within result set) -->
sw_display_title_tesim^15
main_title_text_anchored_im^300
main_title_text_unstemmed_im^150
main_title_tenim^30
full_title_unstemmed_im^30
full_title_tenim^15
additional_titles_unstemmed_im^15
additional_titles_tenim^9

contributor_text_nostem_im^9
topic_tesim^6

Expand All @@ -107,7 +128,14 @@
source_id_text_nostem_i^3
</str>
<str name="pf2"> <!--(defType edismax: token bigrams boost within result set) -->
sw_display_title_tesim^10
main_title_text_anchored_im^200
main_title_text_unstemmed_im^100
main_title_tenim^20
full_title_unstemmed_im^20
full_title_tenim^10
additional_titles_unstemmed_im^10
additional_titles_tenim^6

contributor_text_nostem_im^6
topic_tesim^4

Expand Down Expand Up @@ -151,7 +179,14 @@
<bool name="lowercaseOperators">true</bool>

<str name="qf">
sw_display_title_tesim^5
main_title_text_anchored_im^100
main_title_text_unstemmed_im^50
main_title_tenim^10
full_title_unstemmed_im^10
full_title_tenim^5
additional_titles_unstemmed_im^5
additional_titles_tenim^3

contributor_text_nostem_im^3
topic_tesim^2

Expand Down Expand Up @@ -184,7 +219,14 @@
contributor_orcids_ssim
</str>
<str name="pf"> <!-- (defType dismax, edismax: phrase boost within result set) -->
sw_display_title_tesim^25
main_title_text_anchored_im^500
main_title_text_unstemmed_im^250
main_title_tenim^50
full_title_unstemmed_im^50
full_title_tenim^25
additional_titles_unstemmed_im^25
additional_titles_tenim^15

contributor_text_nostem_im^15
topic_tesim^10

Expand All @@ -200,7 +242,14 @@
source_id_text_nostem_i^5
</str>
<str name="pf3"> <!-- (defType edismax: token trigrams boost within result set) -->
sw_display_title_tesim^15
main_title_text_anchored_im^300
main_title_text_unstemmed_im^150
main_title_tenim^30
full_title_unstemmed_im^30
full_title_tenim^15
additional_titles_unstemmed_im^15
additional_titles_tenim^9

contributor_text_nostem_im^9
topic_tesim^6

Expand All @@ -216,7 +265,14 @@
source_id_text_nostem_i^3
</str>
<str name="pf2"> <!--(defType edismax: token bigrams boost within result set) -->
sw_display_title_tesim^10
main_title_text_anchored_im^200
main_title_text_unstemmed_im^100
main_title_tenim^20
full_title_unstemmed_im^20
full_title_tenim^10
additional_titles_unstemmed_im^10
additional_titles_tenim^6

contributor_text_nostem_im^6
topic_tesim^4

Expand Down

0 comments on commit 3d20eda

Please sign in to comment.