From 11031a1eb014c74440bee571e97cbb20765f1459 Mon Sep 17 00:00:00 2001 From: Tommaso Teofili Date: Sun, 22 Mar 2020 18:03:22 +0100 Subject: [PATCH 01/13] no args constructor for FakeWordsEncoderAnalyzer --- .../java/io/anserini/ann/fw/FakeWordsEncoderAnalyzer.java | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/src/main/java/io/anserini/ann/fw/FakeWordsEncoderAnalyzer.java b/src/main/java/io/anserini/ann/fw/FakeWordsEncoderAnalyzer.java index a9e537f4c3..214fe1be72 100644 --- a/src/main/java/io/anserini/ann/fw/FakeWordsEncoderAnalyzer.java +++ b/src/main/java/io/anserini/ann/fw/FakeWordsEncoderAnalyzer.java @@ -30,10 +30,17 @@ public class FakeWordsEncoderAnalyzer extends Analyzer { static final String REMOVE_IT = "_"; + + private static final int DEFAULT_Q = 60; + private final int q; private final CharArraySet set = new CharArraySet(1, false); + public FakeWordsEncoderAnalyzer() { + this(DEFAULT_Q); + } + public FakeWordsEncoderAnalyzer(int q) { this.q = q; this.set.add(REMOVE_IT); From 8948fa70ace666d339f3e9d30c2101df5ade628c Mon Sep 17 00:00:00 2001 From: tteofili Date: Thu, 14 Jan 2021 17:04:39 +0100 Subject: [PATCH 02/13] merge --- docs/experiments-jdiq2018.md | 58 +++++++++---------- docs/regressions-backgroundlinking18.md | 4 +- docs/regressions-backgroundlinking19.md | 4 +- docs/regressions-car17v1.5.md | 4 +- docs/regressions-car17v2.0-doc2query.md | 4 +- docs/regressions-car17v2.0.md | 4 +- docs/regressions-clef06-fr.md | 6 +- docs/regressions-core17.md | 4 +- docs/regressions-core18.md | 4 +- docs/regressions-cw09b.md | 24 ++++---- docs/regressions-cw12.md | 16 ++--- docs/regressions-cw12b13.md | 16 ++--- docs/regressions-disk12.md | 12 ++-- docs/regressions-dl19-doc.md | 10 ++-- docs/regressions-dl19-passage.md | 10 ++-- docs/regressions-fire12-bn.md | 6 +- docs/regressions-fire12-en.md | 6 +- docs/regressions-fire12-hi.md | 6 +- docs/regressions-gov2.md | 12 ++-- docs/regressions-mb11.md | 8 +-- docs/regressions-mb13.md | 8 +-- ...sions-msmarco-doc-docTTTTTquery-per-doc.md | 4 +- ...s-msmarco-doc-docTTTTTquery-per-passage.md | 4 +- docs/regressions-msmarco-doc.md | 4 +- docs/regressions-msmarco-passage-doc2query.md | 4 +- ...gressions-msmarco-passage-docTTTTTquery.md | 4 +- docs/regressions-msmarco-passage.md | 4 +- docs/regressions-ntcir8-zh.md | 6 +- docs/regressions-robust04.md | 4 +- docs/regressions-robust05.md | 4 +- docs/regressions-trec02-ar.md | 6 +- docs/regressions-wt10g.md | 4 +- 32 files changed, 137 insertions(+), 137 deletions(-) diff --git a/docs/experiments-jdiq2018.md b/docs/experiments-jdiq2018.md index 1364c72fad..8e7a5dc7b8 100644 --- a/docs/experiments-jdiq2018.md +++ b/docs/experiments-jdiq2018.md @@ -46,95 +46,95 @@ The script assumes hard-coded index directories; modify as appropriate. 
#### disk12 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.151-200.txt | 0.2614 | 0.2512 | 0.2544 | 0.2558 | 0.2571 | 0.2459 | -topics.51-100.txt | 0.2274 | 0.2245 | 0.2226 | 0.2226 | 0.2260 | 0.2201 | -topics.101-150.txt | 0.2071 | 0.2035 | 0.1967 | 0.2015 | 0.2031 | 0.1840 | +topics.151-200.txt | 0,2614 | 0,2512 | 0,2544 | 0,2558 | 0,2571 | 0,2459 | +topics.51-100.txt | 0,2274 | 0,2245 | 0,2226 | 0,2226 | 0,2260 | 0,2201 | +topics.101-150.txt | 0,2071 | 0,2035 | 0,1967 | 0,2015 | 0,2031 | 0,1840 | #### robust04 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.robust04.301-450.601-700.txt | 0.2543 | 0.2516 | 0.2531 | 0.2514 | 0.2523 | 0.2509 | +topics.robust04.301-450.601-700.txt | 0,2543 | 0,2516 | 0,2531 | 0,2514 | 0,2523 | 0,2509 | #### robust05 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.robust05.txt | 0.2097 | 0.1998 | 0.2021 | 0.2030 | 0.2023 | 0.1980 | +topics.robust05.txt | 0,2097 | 0,1998 | 0,2021 | 0,2030 | 0,2023 | 0,1980 | #### core17 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.core17.txt | 0.2052 | 0.2005 | 0.2019 | 0.1943 | 0.2050 | 0.1999 | +topics.core17.txt | 0,2052 | 0,2005 | 0,2019 | 0,1943 | 0,2050 | 0,1999 | #### wt10g MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.451-550.txt | 0.2005 | 0.2002 | 0.1880 | 0.2021 | 0.1946 | 0.1704 | +topics.451-550.txt | 0,2005 | 0,2002 | 0,1880 | 0,2021 | 0,1946 | 0,1704 | #### gov2 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.701-750.txt | 0.2702 | 0.2592 | 0.2726 | 0.2700 | 0.2689 | 0.2734 | -topics.751-800.txt | 0.3394 | 0.3195 | 0.3439 | 0.3303 | 0.3342 | 0.3393 | -topics.801-850.txt | 0.3085 | 0.2900 | 0.3088 | 0.3013 | 0.3026 | 0.3139 | +topics.701-750.txt | 0,2702 | 0,2592 | 0,2726 | 0,2700 | 0,2689 | 0,2734 | +topics.751-800.txt | 0,3394 | 0,3195 | 0,3439 | 0,3303 | 0,3342 | 0,3393 | +topics.801-850.txt | 0,3085 | 0,2900 | 0,3088 | 0,3013 | 0,3026 | 0,3139 | #### cw09b ERR20 | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.web.151-200.txt | 0.1524 | 0.1387 | 0.1439 | 0.1484 | 0.1524 | 0.1445 | -topics.web.101-150.txt | 0.0981 | 0.0935 | 0.0892 | 0.0868 | 0.0944 | 0.0893 | -topics.web.51-100.txt | 0.0774 | 0.0776 | 0.0635 | 0.0643 | 0.0725 | 0.0659 | +topics.web.151-200.txt | 0,1524 | 0,1387 | 0,1439 | 0,1484 | 0,1524 | 0,1445 | +topics.web.101-150.txt | 0,0981 | 0,0935 | 0,0892 | 0,0868 | 0,0944 | 0,0893 | +topics.web.51-100.txt | 0,0774 | 0,0776 | 0,0635 | 0,0643 | 0,0725 | 0,0659 | NDCG20 | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.web.151-200.txt | 0.1090 | 0.0933 | 0.0927 | 0.0978 | 0.0986 | 0.0933 | -topics.web.101-150.txt | 0.1927 | 0.1878 | 0.1765 | 0.1701 | 0.1917 | 
0.1758 | -topics.web.51-100.txt | 0.1487 | 0.1418 | 0.1217 | 0.1185 | 0.1376 | 0.1252 | +topics.web.151-200.txt | 0,1090 | 0,0933 | 0,0927 | 0,0978 | 0,0986 | 0,0933 | +topics.web.101-150.txt | 0,1927 | 0,1878 | 0,1765 | 0,1701 | 0,1917 | 0,1758 | +topics.web.51-100.txt | 0,1487 | 0,1418 | 0,1217 | 0,1185 | 0,1376 | 0,1252 | MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.web.151-200.txt | 0.1226 | 0.1089 | 0.1170 | 0.1113 | 0.1091 | 0.1163 | -topics.web.101-150.txt | 0.1104 | 0.1081 | 0.1067 | 0.1004 | 0.1104 | 0.1063 | -topics.web.51-100.txt | 0.1165 | 0.1111 | 0.1103 | 0.1060 | 0.1110 | 0.1099 | +topics.web.151-200.txt | 0,1226 | 0,1089 | 0,1170 | 0,1113 | 0,1091 | 0,1163 | +topics.web.101-150.txt | 0,1104 | 0,1081 | 0,1067 | 0,1004 | 0,1104 | 0,1063 | +topics.web.51-100.txt | 0,1165 | 0,1111 | 0,1103 | 0,1060 | 0,1110 | 0,1099 | #### cw12b13 ERR20 | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.web.251-300.txt | 0.1224 | 0.1203 | 0.1109 | 0.1108 | 0.1209 | 0.1135 | -topics.web.201-250.txt | 0.0993 | 0.0797 | 0.0933 | 0.0898 | 0.0821 | 0.0940 | +topics.web.251-300.txt | 0,1224 | 0,1203 | 0,1109 | 0,1108 | 0,1209 | 0,1135 | +topics.web.201-250.txt | 0,0993 | 0,0797 | 0,0933 | 0,0898 | 0,0821 | 0,0940 | NDCG20 | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.web.251-300.txt | 0.1247 | 0.1159 | 0.1213 | 0.1209 | 0.1189 | 0.1213 | -topics.web.201-250.txt | 0.1384 | 0.1222 | 0.1247 | 0.1168 | 0.1247 | 0.1258 | +topics.web.251-300.txt | 0,1247 | 0,1159 | 0,1213 | 0,1209 | 0,1189 | 0,1213 | +topics.web.201-250.txt | 0,1384 | 0,1222 | 0,1247 | 0,1168 | 0,1247 | 0,1258 | MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.web.251-300.txt | 0.0237 | 0.0205 | 0.0242 | 0.0246 | 0.0213 | 0.0240 | -topics.web.201-250.txt | 0.0481 | 0.0450 | 0.0419 | 0.0398 | 0.0454 | 0.0418 | +topics.web.251-300.txt | 0,0237 | 0,0205 | 0,0242 | 0,0246 | 0,0213 | 0,0240 | +topics.web.201-250.txt | 0,0481 | 0,0450 | 0,0419 | 0,0398 | 0,0454 | 0,0418 | #### mb11 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.microblog2012.txt | 0.2083 | 0.2107 | 0.2046 | 0.2121 | 0.2033 | 0.2055 | -topics.microblog2011.txt | 0.3643 | 0.3769 | 0.3537 | 0.3607 | 0.3823 | 0.3567 | +topics.microblog2012.txt | 0,2083 | 0,2107 | 0,2046 | 0,2121 | 0,2033 | 0,2055 | +topics.microblog2011.txt | 0,3643 | 0,3769 | 0,3537 | 0,3607 | 0,3823 | 0,3567 | #### mb13 MAP | BM25 | F2EXP | PL2 | QL | F2LOG | SPL | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -topics.microblog2013.txt | 0.2600 | 0.2531 | 0.2524 | 0.2615 | 0.2622 | 0.2530 | -topics.microblog2014.txt | 0.4195 | 0.3854 | 0.4132 | 0.4200 | 0.4121 | 0.4147 | +topics.microblog2013.txt | 0,2600 | 0,2531 | 0,2524 | 0,2615 | 0,2622 | 0,2530 | +topics.microblog2014.txt | 0,4195 | 0,3854 | 0,4132 | 0,4200 | 0,4121 | 0,4147 | diff --git a/docs/regressions-backgroundlinking18.md b/docs/regressions-backgroundlinking18.md index 2a6d64e088..ad62257415 100644 --- 
a/docs/regressions-backgroundlinking18.md +++ b/docs/regressions-backgroundlinking18.md @@ -64,10 +64,10 @@ With the above commands, you should be able to replicate the following results: NCDG@5 | BM25 | +RM3 | +RM3+DF | :---------------------------------------|-----------|-----------|-----------| -[TREC 2018 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking18.txt)| 0.3293 | 0.3526 | 0.4171 | +[TREC 2018 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking18.txt)| 0,3293 | 0,3526 | 0,4171 | AP | BM25 | +RM3 | +RM3+DF | :---------------------------------------|-----------|-----------|-----------| -[TREC 2018 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking18.txt)| 0.2490 | 0.2642 | 0.2692 | +[TREC 2018 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking18.txt)| 0,2490 | 0,2642 | 0,2692 | diff --git a/docs/regressions-backgroundlinking19.md b/docs/regressions-backgroundlinking19.md index 60e834ae07..76655539ff 100644 --- a/docs/regressions-backgroundlinking19.md +++ b/docs/regressions-backgroundlinking19.md @@ -64,10 +64,10 @@ With the above commands, you should be able to replicate the following results: NCDG@5 | BM25 | +RM3 | +RM3+DF | :---------------------------------------|-----------|-----------|-----------| -[TREC 2019 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking19.txt)| 0.4785 | 0.5217 | 0.5051 | +[TREC 2019 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking19.txt)| 0,4785 | 0,5217 | 0,5051 | AP | BM25 | +RM3 | +RM3+DF | :---------------------------------------|-----------|-----------|-----------| -[TREC 2019 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking19.txt)| 0.3027 | 0.3790 | 0.3158 | +[TREC 2019 Topics](../src/main/resources/topics-and-qrels/topics.backgroundlinking19.txt)| 0,3027 | 0,3790 | 0,3158 | diff --git a/docs/regressions-car17v1.5.md b/docs/regressions-car17v1.5.md index 634027010b..34b5b63952 100644 --- a/docs/regressions-car17v1.5.md +++ b/docs/regressions-car17v1.5.md @@ -86,9 +86,9 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 CAR: benchmarkY1test (v1.5)](../src/main/resources/topics-and-qrels/topics.car17v1.5.benchmarkY1test.txt/)| 0.1562 | 0.1295 | 0.1358 | 0.1386 | 0.1080 | 0.1048 | +[TREC 2017 CAR: benchmarkY1test (v1.5)](../src/main/resources/topics-and-qrels/topics.car17v1.5.benchmarkY1test.txt/)| 0,1562 | 0,1295 | 0,1358 | 0,1386 | 0,1080 | 0,1048 | RECIP_RANK | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 CAR: benchmarkY1test (v1.5)](../src/main/resources/topics-and-qrels/topics.car17v1.5.benchmarkY1test.txt/)| 0.2331 | 0.1923 | 0.1949 | 0.2037 | 0.1599 | 0.1524 | +[TREC 2017 CAR: benchmarkY1test (v1.5)](../src/main/resources/topics-and-qrels/topics.car17v1.5.benchmarkY1test.txt/)| 0,2331 | 0,1923 | 0,1949 | 0,2037 | 0,1599 | 0,1524 | diff --git a/docs/regressions-car17v2.0-doc2query.md b/docs/regressions-car17v2.0-doc2query.md index 0cf28028e1..0c9bf99307 100644 --- a/docs/regressions-car17v2.0-doc2query.md +++ b/docs/regressions-car17v2.0-doc2query.md @@ -92,9 +92,9 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | 
+RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0.1807 | 0.1521 | 0.1470 | 0.1752 | 0.1453 | 0.1339 | +[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0,1807 | 0,1521 | 0,1470 | 0,1752 | 0,1453 | 0,1339 | RECIP_RANK | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0.2750 | 0.2275 | 0.2186 | 0.2653 | 0.2156 | 0.1981 | +[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0,2750 | 0,2275 | 0,2186 | 0,2653 | 0,2156 | 0,1981 | diff --git a/docs/regressions-car17v2.0.md b/docs/regressions-car17v2.0.md index e7925e12e9..b3d41a1ac5 100644 --- a/docs/regressions-car17v2.0.md +++ b/docs/regressions-car17v2.0.md @@ -86,9 +86,9 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0.1545 | 0.1286 | 0.1364 | 0.1371 | 0.1080 | 0.1077 | +[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0,1545 | 0,1286 | 0,1364 | 0,1371 | 0,1080 | 0,1077 | RECIP_RANK | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0.2321 | 0.1927 | 0.1978 | 0.2013 | 0.1598 | 0.1588 | +[TREC 2017 CAR: benchmarkY1test (v2.0)](../src/main/resources/topics-and-qrels/topics.car17v2.0.benchmarkY1test.txt)| 0,2321 | 0,1927 | 0,1978 | 0,2013 | 0,1598 | 0,1588 | diff --git a/docs/regressions-clef06-fr.md b/docs/regressions-clef06-fr.md index f400cc222e..f99750d2ec 100644 --- a/docs/regressions-clef06-fr.md +++ b/docs/regressions-clef06-fr.md @@ -53,14 +53,14 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | :---------------------------------------|-----------| -[CLEF 2006 (Monolingual French)](../src/main/resources/topics-and-qrels/topics.clef06fr.mono.fr.txt)| 0.3111 | +[CLEF 2006 (Monolingual French)](../src/main/resources/topics-and-qrels/topics.clef06fr.mono.fr.txt)| 0,3111 | P20 | BM25 | :---------------------------------------|-----------| -[CLEF 2006 (Monolingual French)](../src/main/resources/topics-and-qrels/topics.clef06fr.mono.fr.txt)| 0.3184 | +[CLEF 2006 (Monolingual French)](../src/main/resources/topics-and-qrels/topics.clef06fr.mono.fr.txt)| 0,3184 | NDCG20 | BM25 | :---------------------------------------|-----------| -[CLEF 2006 (Monolingual French)](../src/main/resources/topics-and-qrels/topics.clef06fr.mono.fr.txt)| 0.4458 | +[CLEF 2006 (Monolingual French)](../src/main/resources/topics-and-qrels/topics.clef06fr.mono.fr.txt)| 0,4458 | diff --git a/docs/regressions-core17.md b/docs/regressions-core17.md index 0f4d7d9a84..2feb604eb0 100644 --- 
a/docs/regressions-core17.md +++ b/docs/regressions-core17.md @@ -85,12 +85,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core17.txt)| 0.2087 | 0.2823 | 0.2739 | 0.2032 | 0.2606 | 0.2579 | +[TREC 2017 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core17.txt)| 0,2087 | 0,2823 | 0,2739 | 0,2032 | 0,2606 | 0,2579 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2017 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core17.txt)| 0.4293 | 0.5093 | 0.4940 | 0.4467 | 0.4827 | 0.4893 | +[TREC 2017 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core17.txt)| 0,4293 | 0,5093 | 0,4940 | 0,4467 | 0,4827 | 0,4893 | ## Replication Log diff --git a/docs/regressions-core18.md b/docs/regressions-core18.md index c7a1b07548..81110eacca 100644 --- a/docs/regressions-core18.md +++ b/docs/regressions-core18.md @@ -85,12 +85,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2018 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core18.txt)| 0.2495 | 0.3135 | 0.2841 | 0.2526 | 0.3073 | 0.2919 | +[TREC 2018 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core18.txt)| 0,2495 | 0,3135 | 0,2841 | 0,2526 | 0,3073 | 0,2919 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2018 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core18.txt)| 0.3567 | 0.4200 | 0.3947 | 0.3653 | 0.4000 | 0.4020 | +[TREC 2018 Common Core Track Topics](../src/main/resources/topics-and-qrels/topics.core18.txt)| 0,3567 | 0,4200 | 0,3947 | 0,3653 | 0,4000 | 0,4020 | ## Replication Log diff --git a/docs/regressions-cw09b.md b/docs/regressions-cw09b.md index b71b1deaf9..1971dd0c9f 100644 --- a/docs/regressions-cw09b.md +++ b/docs/regressions-cw09b.md @@ -168,27 +168,27 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0.1126 | 0.0933 | 0.0929 | 0.1060 | 0.1019 | 0.1086 | -[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0.1094 | 0.1085 | 0.0975 | 0.0958 | 0.0839 | 0.0879 | -[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0.1105 | 0.1107 | 0.1315 | 0.1069 | 0.1058 | 0.1212 | +[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0,1126 | 0,0933 | 0,0929 | 0,1060 | 0,1019 | 0,1086 | +[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0,1094 | 0,1085 | 0,0975 | 0,0958 | 0,0839 | 0,0879 | +[TREC 2012 Web Track (Topics 
151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0,1105 | 0,1107 | 0,1315 | 0,1069 | 0,1058 | 0,1212 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0.2694 | 0.2389 | 0.2354 | 0.2431 | 0.2312 | 0.2618 | -[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0.2513 | 0.2480 | 0.2387 | 0.2147 | 0.2047 | 0.2173 | -[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0.2167 | 0.1920 | 0.2553 | 0.2080 | 0.1980 | 0.2147 | +[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0,2694 | 0,2389 | 0,2354 | 0,2431 | 0,2312 | 0,2618 | +[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0,2513 | 0,2480 | 0,2387 | 0,2147 | 0,2047 | 0,2173 | +[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0,2167 | 0,1920 | 0,2553 | 0,2080 | 0,1980 | 0,2147 | NDCG20 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0.1354 | 0.1369 | 0.1632 | 0.1143 | 0.1182 | 0.1454 | -[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0.1890 | 0.1916 | 0.1835 | 0.1619 | 0.1449 | 0.1517 | -[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0.1014 | 0.0918 | 0.1441 | 0.0868 | 0.0896 | 0.1037 | +[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0,1354 | 0,1369 | 0,1632 | 0,1143 | 0,1182 | 0,1454 | +[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0,1890 | 0,1916 | 0,1835 | 0,1619 | 0,1449 | 0,1517 | +[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0,1014 | 0,0918 | 0,1441 | 0,0868 | 0,0896 | 0,1037 | ERR20 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0.0733 | 0.0747 | 0.0977 | 0.0599 | 0.0592 | 0.0742 | -[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0.0959 | 0.0960 | 0.1091 | 0.0849 | 0.0787 | 0.0821 | -[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0.1303 | 0.1494 | 0.2355 | 0.1305 | 0.1334 | 0.1558 | +[TREC 2010 Web Track (Topics 51-100)](../src/main/resources/topics-and-qrels/topics.web.51-100.txt)| 0,0733 | 0,0747 | 0,0977 | 0,0599 | 0,0592 | 0,0742 | +[TREC 2011 Web Track (Topics 101-150)](../src/main/resources/topics-and-qrels/topics.web.101-150.txt)| 0,0959 | 0,0960 | 0,1091 | 0,0849 | 0,0787 | 0,0821 | +[TREC 2012 Web Track (Topics 151-200)](../src/main/resources/topics-and-qrels/topics.web.151-200.txt)| 0,1303 | 0,1494 | 0,2355 | 0,1305 | 0,1334 | 0,1558 | diff --git a/docs/regressions-cw12.md b/docs/regressions-cw12.md index 7708f7cb72..bbb57a39fd 100644 --- 
a/docs/regressions-cw12.md +++ b/docs/regressions-cw12.md @@ -100,23 +100,23 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | QL | +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.1694 | 0.1464 | 0.1494 | 0.1290 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.2469 | 0.2324 | 0.2466 | 0.2177 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,1694 | 0,1464 | 0,1494 | 0,1290 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,2469 | 0,2324 | 0,2466 | 0,2177 | P30 | BM25 | +RM3 | QL | +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.2773 | 0.2393 | 0.2607 | 0.2347 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.4547 | 0.4080 | 0.4380 | 0.3800 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,2773 | 0,2393 | 0,2607 | 0,2347 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,4547 | 0,4080 | 0,4380 | 0,3800 | NDCG20 | BM25 | +RM3 | QL | +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.2088 | 0.2033 | 0.1993 | 0.1725 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.2572 | 0.2530 | 0.2218 | 0.2083 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,2088 | 0,2033 | 0,1993 | 0,1725 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,2572 | 0,2530 | 0,2218 | 0,2083 | ERR20 | BM25 | +RM3 | QL | +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.1284 | 0.1264 | 0.1233 | 0.1008 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.1616 | 0.1655 | 0.1322 | 0.1245 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,1284 | 0,1264 | 0,1233 | 0,1008 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,1616 | 0,1655 | 0,1322 | 0,1245 | diff --git a/docs/regressions-cw12b13.md b/docs/regressions-cw12b13.md index 7c528d4d44..74ba8e596e 100644 --- a/docs/regressions-cw12b13.md +++ b/docs/regressions-cw12b13.md @@ -128,26 +128,26 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.0468 | 0.0408 | 0.0435 | 0.0397 | 0.0322 | 0.0358 | -[TREC 2014 Web Track (Topics 
251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.0224 | 0.0210 | 0.0180 | 0.0235 | 0.0203 | 0.0183 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,0468 | 0,0408 | 0,0435 | 0,0397 | 0,0322 | 0,0358 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,0224 | 0,0210 | 0,0180 | 0,0235 | 0,0203 | 0,0183 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.2113 | 0.1673 | 0.1833 | 0.1780 | 0.1513 | 0.1507 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.1273 | 0.1207 | 0.1107 | 0.1373 | 0.1173 | 0.1147 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,2113 | 0,1673 | 0,1833 | 0,1780 | 0,1513 | 0,1507 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,1273 | 0,1207 | 0,1107 | 0,1373 | 0,1173 | 0,1147 | NDCG20 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.1286 | 0.1119 | 0.1287 | 0.1106 | 0.0920 | 0.1141 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.1183 | 0.1081 | 0.0963 | 0.1177 | 0.1004 | 0.0989 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,1286 | 0,1119 | 0,1287 | 0,1106 | 0,0920 | 0,1141 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,1183 | 0,1081 | 0,0963 | 0,1177 | 0,1004 | 0,0989 | ERR20 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0.0838 | 0.0753 | 0.0941 | 0.0768 | 0.0553 | 0.0780 | -[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0.1201 | 0.1066 | 0.0928 | 0.1092 | 0.0928 | 0.0900 | +[TREC 2013 Web Track (Topics 201-250)](../src/main/resources/topics-and-qrels/topics.web.201-250.txt)| 0,0838 | 0,0753 | 0,0941 | 0,0768 | 0,0553 | 0,0780 | +[TREC 2014 Web Track (Topics 251-300)](../src/main/resources/topics-and-qrels/topics.web.251-300.txt)| 0,1201 | 0,1066 | 0,0928 | 0,1092 | 0,0928 | 0,0900 | ## Replication Log diff --git a/docs/regressions-disk12.md b/docs/regressions-disk12.md index 419e9d01dc..d7ccb68cfa 100644 --- a/docs/regressions-disk12.md +++ b/docs/regressions-disk12.md @@ -148,13 +148,13 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC-1 Ad Hoc Topics 51-100](../src/main/resources/topics-and-qrels/topics.adhoc.51-100.txt)| 0.2273 | 0.2634 | 0.2640 | 0.2189 | 0.2435 | 0.2501 | -[TREC-2 Ad Hoc Topics 101-150](../src/main/resources/topics-and-qrels/topics.adhoc.101-150.txt)| 0.2010 | 0.2587 | 0.2722 | 0.2015 | 
0.2442 | 0.2593 | -[TREC-3 Ad Hoc Topics 151-200](../src/main/resources/topics-and-qrels/topics.adhoc.151-200.txt)| 0.2580 | 0.3390 | 0.3318 | 0.2518 | 0.3042 | 0.3103 | +[TREC-1 Ad Hoc Topics 51-100](../src/main/resources/topics-and-qrels/topics.adhoc.51-100.txt)| 0,2273 | 0,2634 | 0,2640 | 0,2189 | 0,2435 | 0,2501 | +[TREC-2 Ad Hoc Topics 101-150](../src/main/resources/topics-and-qrels/topics.adhoc.101-150.txt)| 0,2010 | 0,2587 | 0,2722 | 0,2015 | 0,2442 | 0,2593 | +[TREC-3 Ad Hoc Topics 151-200](../src/main/resources/topics-and-qrels/topics.adhoc.151-200.txt)| 0,2580 | 0,3390 | 0,3318 | 0,2518 | 0,3042 | 0,3103 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC-1 Ad Hoc Topics 51-100](../src/main/resources/topics-and-qrels/topics.adhoc.51-100.txt)| 0.4533 | 0.4800 | 0.5067 | 0.4520 | 0.4627 | 0.4953 | -[TREC-2 Ad Hoc Topics 101-150](../src/main/resources/topics-and-qrels/topics.adhoc.101-150.txt)| 0.4280 | 0.4593 | 0.4753 | 0.4207 | 0.4420 | 0.4740 | -[TREC-3 Ad Hoc Topics 151-200](../src/main/resources/topics-and-qrels/topics.adhoc.151-200.txt)| 0.4740 | 0.5273 | 0.5100 | 0.4580 | 0.4913 | 0.5167 | +[TREC-1 Ad Hoc Topics 51-100](../src/main/resources/topics-and-qrels/topics.adhoc.51-100.txt)| 0,4533 | 0,4800 | 0,5067 | 0,4520 | 0,4627 | 0,4953 | +[TREC-2 Ad Hoc Topics 101-150](../src/main/resources/topics-and-qrels/topics.adhoc.101-150.txt)| 0,4280 | 0,4593 | 0,4753 | 0,4207 | 0,4420 | 0,4740 | +[TREC-3 Ad Hoc Topics 151-200](../src/main/resources/topics-and-qrels/topics.adhoc.151-200.txt)| 0,4740 | 0,5273 | 0,5100 | 0,4580 | 0,4913 | 0,5167 | diff --git a/docs/regressions-dl19-doc.md b/docs/regressions-dl19-doc.md index 230fd8022b..a3cbd87cb2 100644 --- a/docs/regressions-dl19-doc.md +++ b/docs/regressions-dl19-doc.md @@ -100,27 +100,27 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0.3309 | 0.3870 | 0.3516 | 0.3624 | 0.3138 | 0.3697 | 0.3860 | 0.3858 | +[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0,3309 | 0,3870 | 0,3516 | 0,3624 | 0,3138 | 0,3697 | 0,3860 | 0,3858 | NDCG@10 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0.5190 | 0.5169 | 0.4730 | 0.5105 | 0.5140 | 0.5485 | 0.5245 | 0.5280 | +[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0,5190 | 0,5169 | 0,4730 | 0,5105 | 0,5140 | 0,5485 | 0,5245 | 0,5280 | RR | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0.8046 | 0.7718 | 0.7428 | 0.7775 | 0.8872 | 0.8074 | 0.7492 | 0.8007 | +[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0,8046 | 0,7718 | 0,7428 | 0,7775 | 0,8872 | 0,8074 | 0,7492 | 0,8007 | R@100 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | 
:---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0.3948 | 0.4189 | 0.3945 | 0.4004 | 0.3862 | 0.4193 | 0.4399 | 0.4287 | +[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0,3948 | 0,4189 | 0,3945 | 0,4004 | 0,3862 | 0,4193 | 0,4399 | 0,4287 | R@1000 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0.6966 | 0.7504 | 0.7323 | 0.7357 | 0.6810 | 0.7282 | 0.7545 | 0.7553 | +[DL19 (Doc)](https://trec.nist.gov/data/deep2019.html)| 0,6966 | 0,7504 | 0,7323 | 0,7357 | 0,6810 | 0,7282 | 0,7545 | 0,7553 | The setting "default" refers the default BM25 settings of `k1=0.9`, `b=0.4`, while "tuned" refers to the tuned setting of `k1=3.44`, `b=0.87` (see [this page](experiments-msmarco-doc.md) for more details about tuning). diff --git a/docs/regressions-dl19-passage.md b/docs/regressions-dl19-passage.md index 308347db74..4413c84368 100644 --- a/docs/regressions-dl19-passage.md +++ b/docs/regressions-dl19-passage.md @@ -101,27 +101,27 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0.3773 | 0.4270 | 0.4651 | 0.4533 | 0.3766 | 0.4249 | 0.4722 | 0.4522 | +[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0,3773 | 0,4270 | 0,4651 | 0,4533 | 0,3766 | 0,4249 | 0,4722 | 0,4522 | NDCG@10 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0.5058 | 0.5180 | 0.5511 | 0.5372 | 0.4973 | 0.5231 | 0.5461 | 0.5536 | +[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0,5058 | 0,5180 | 0,5511 | 0,5372 | 0,4973 | 0,5231 | 0,5461 | 0,5536 | RR | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0.8245 | 0.8167 | 0.7736 | 0.8170 | 0.8457 | 0.8229 | 0.8218 | 0.8178 | +[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0,8245 | 0,8167 | 0,7736 | 0,8170 | 0,8457 | 0,8229 | 0,8218 | 0,8178 | R@100 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0.4531 | 0.4761 | 0.4995 | 0.4974 | 0.4603 | 0.4747 | 0.5065 | 0.4969 | +[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0,4531 | 0,4761 | 0,4995 | 0,4974 | 0,4603 | 0,4747 | 0,5065 | 0,4969 | R@1000 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[DL19 
(Passage)](https://trec.nist.gov/data/deep2019.html)| 0.7389 | 0.7882 | 0.8129 | 0.7845 | 0.7384 | 0.7762 | 0.8094 | 0.7894 | +[DL19 (Passage)](https://trec.nist.gov/data/deep2019.html)| 0,7389 | 0,7882 | 0,8129 | 0,7845 | 0,7384 | 0,7762 | 0,8094 | 0,7894 | The setting "default" refers the default BM25 settings of `k1=0.9`, `b=0.4`, while "tuned" refers to the tuned setting of `k1=0.82`, `b=0.68` (see [this page](experiments-msmarco-passage.md) for more details about tuning). diff --git a/docs/regressions-fire12-bn.md b/docs/regressions-fire12-bn.md index af234ad82f..8b0d731c83 100644 --- a/docs/regressions-fire12-bn.md +++ b/docs/regressions-fire12-bn.md @@ -52,14 +52,14 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual Bengali)](../src/main/resources/topics-and-qrels/topics.fire12bn.176-225.txt)| 0.2881 | +[FIRE 2012 (Monolingual Bengali)](../src/main/resources/topics-and-qrels/topics.fire12bn.176-225.txt)| 0,2881 | P20 | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual Bengali)](../src/main/resources/topics-and-qrels/topics.fire12bn.176-225.txt)| 0.3740 | +[FIRE 2012 (Monolingual Bengali)](../src/main/resources/topics-and-qrels/topics.fire12bn.176-225.txt)| 0,3740 | NDCG20 | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual Bengali)](../src/main/resources/topics-and-qrels/topics.fire12bn.176-225.txt)| 0.4261 | +[FIRE 2012 (Monolingual Bengali)](../src/main/resources/topics-and-qrels/topics.fire12bn.176-225.txt)| 0,4261 | diff --git a/docs/regressions-fire12-en.md b/docs/regressions-fire12-en.md index 1e6c99bae3..ccaa12d0d7 100644 --- a/docs/regressions-fire12-en.md +++ b/docs/regressions-fire12-en.md @@ -52,14 +52,14 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual English)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0.3713 | +[FIRE 2012 (Monolingual English)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0,3713 | P20 | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual English)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0.4970 | +[FIRE 2012 (Monolingual English)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0,4970 | NDCG20 | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual English)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0.5420 | +[FIRE 2012 (Monolingual English)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0,5420 | diff --git a/docs/regressions-fire12-hi.md b/docs/regressions-fire12-hi.md index 149228ac72..4f13502e6a 100644 --- a/docs/regressions-fire12-hi.md +++ b/docs/regressions-fire12-hi.md @@ -52,14 +52,14 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual Hindi)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0.3867 | +[FIRE 2012 (Monolingual Hindi)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0,3867 | P20 | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual Hindi)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 
0.4470 | +[FIRE 2012 (Monolingual Hindi)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0,4470 | NDCG20 | BM25 | :---------------------------------------|-----------| -[FIRE 2012 (Monolingual Hindi)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0.5310 | +[FIRE 2012 (Monolingual Hindi)](../src/main/resources/topics-and-qrels/topics.fire12en.176-225.txt)| 0,5310 | diff --git a/docs/regressions-gov2.md b/docs/regressions-gov2.md index c0e47f7b29..da9985ea5e 100644 --- a/docs/regressions-gov2.md +++ b/docs/regressions-gov2.md @@ -148,13 +148,13 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2004 Terabyte Track (Topics 701-750)](../src/main/resources/topics-and-qrels/topics.terabyte04.701-750.txt)| 0.2689 | 0.2844 | 0.2669 | 0.2681 | 0.2708 | 0.2666 | -[TREC 2005 Terabyte Track (Topics 751-800)](../src/main/resources/topics-and-qrels/topics.terabyte05.751-800.txt)| 0.3390 | 0.3820 | 0.3666 | 0.3303 | 0.3559 | 0.3646 | -[TREC 2006 Terabyte Track (Topics 801-850)](../src/main/resources/topics-and-qrels/topics.terabyte06.801-850.txt)| 0.3080 | 0.3377 | 0.3069 | 0.2997 | 0.3154 | 0.3084 | +[TREC 2004 Terabyte Track (Topics 701-750)](../src/main/resources/topics-and-qrels/topics.terabyte04.701-750.txt)| 0,2689 | 0,2844 | 0,2669 | 0,2681 | 0,2708 | 0,2666 | +[TREC 2005 Terabyte Track (Topics 751-800)](../src/main/resources/topics-and-qrels/topics.terabyte05.751-800.txt)| 0,3390 | 0,3820 | 0,3666 | 0,3303 | 0,3559 | 0,3646 | +[TREC 2006 Terabyte Track (Topics 801-850)](../src/main/resources/topics-and-qrels/topics.terabyte06.801-850.txt)| 0,3080 | 0,3377 | 0,3069 | 0,2997 | 0,3154 | 0,3084 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2004 Terabyte Track (Topics 701-750)](../src/main/resources/topics-and-qrels/topics.terabyte04.701-750.txt)| 0.4864 | 0.5190 | 0.4993 | 0.4755 | 0.4925 | 0.4932 | -[TREC 2005 Terabyte Track (Topics 751-800)](../src/main/resources/topics-and-qrels/topics.terabyte05.751-800.txt)| 0.5540 | 0.5920 | 0.5933 | 0.5347 | 0.5620 | 0.5840 | -[TREC 2006 Terabyte Track (Topics 801-850)](../src/main/resources/topics-and-qrels/topics.terabyte06.801-850.txt)| 0.4907 | 0.5160 | 0.5033 | 0.4720 | 0.4847 | 0.4920 | +[TREC 2004 Terabyte Track (Topics 701-750)](../src/main/resources/topics-and-qrels/topics.terabyte04.701-750.txt)| 0,4864 | 0,5190 | 0,4993 | 0,4755 | 0,4925 | 0,4932 | +[TREC 2005 Terabyte Track (Topics 751-800)](../src/main/resources/topics-and-qrels/topics.terabyte05.751-800.txt)| 0,5540 | 0,5920 | 0,5933 | 0,5347 | 0,5620 | 0,5840 | +[TREC 2006 Terabyte Track (Topics 801-850)](../src/main/resources/topics-and-qrels/topics.terabyte06.801-850.txt)| 0,4907 | 0,5160 | 0,5033 | 0,4720 | 0,4847 | 0,4920 | diff --git a/docs/regressions-mb11.md b/docs/regressions-mb11.md index 984ddfa09d..8ab4811db6 100644 --- a/docs/regressions-mb11.md +++ b/docs/regressions-mb11.md @@ -124,11 +124,11 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2011 Microblog Track 
Topics](../src/main/resources/topics-and-qrels/topics.microblog2011.txt)| 0.3384 | 0.3650 | 0.4008 | 0.3584 | 0.3923 | 0.4201 | -[TREC 2012 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2012.txt)| 0.1948 | 0.2193 | 0.2309 | 0.2102 | 0.2389 | 0.2474 | +[TREC 2011 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2011.txt)| 0,3384 | 0,3650 | 0,4008 | 0,3584 | 0,3923 | 0,4201 | +[TREC 2012 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2012.txt)| 0,1948 | 0,2193 | 0,2309 | 0,2102 | 0,2389 | 0,2474 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2011 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2011.txt)| 0.3959 | 0.4170 | 0.4612 | 0.4061 | 0.4435 | 0.4408 | -[TREC 2012 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2012.txt)| 0.3316 | 0.3463 | 0.3554 | 0.3333 | 0.3514 | 0.3842 | +[TREC 2011 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2011.txt)| 0,3959 | 0,4170 | 0,4612 | 0,4061 | 0,4435 | 0,4408 | +[TREC 2012 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2012.txt)| 0,3316 | 0,3463 | 0,3554 | 0,3333 | 0,3514 | 0,3842 | diff --git a/docs/regressions-mb13.md b/docs/regressions-mb13.md index 8e1803c361..c0ffa54249 100644 --- a/docs/regressions-mb13.md +++ b/docs/regressions-mb13.md @@ -124,11 +124,11 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2013 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2013.txt)| 0.2371 | 0.2513 | 0.2855 | 0.2602 | 0.2911 | 0.3152 | -[TREC 2014 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2014.txt)| 0.3931 | 0.4374 | 0.4796 | 0.4181 | 0.4676 | 0.4965 | +[TREC 2013 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2013.txt)| 0,2371 | 0,2513 | 0,2855 | 0,2602 | 0,2911 | 0,3152 | +[TREC 2014 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2014.txt)| 0,3931 | 0,4374 | 0,4796 | 0,4181 | 0,4676 | 0,4965 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2013 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2013.txt)| 0.4339 | 0.4411 | 0.4728 | 0.4561 | 0.4906 | 0.5078 | -[TREC 2014 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2014.txt)| 0.6212 | 0.6442 | 0.6648 | 0.6430 | 0.6533 | 0.6727 | +[TREC 2013 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2013.txt)| 0,4339 | 0,4411 | 0,4728 | 0,4561 | 0,4906 | 0,5078 | +[TREC 2014 Microblog Track Topics](../src/main/resources/topics-and-qrels/topics.microblog2014.txt)| 0,6212 | 0,6442 | 0,6648 | 0,6430 | 0,6533 | 0,6727 | diff --git a/docs/regressions-msmarco-doc-docTTTTTquery-per-doc.md b/docs/regressions-msmarco-doc-docTTTTTquery-per-doc.md index 0e472986f7..68dbb54528 100644 --- a/docs/regressions-msmarco-doc-docTTTTTquery-per-doc.md +++ b/docs/regressions-msmarco-doc-docTTTTTquery-per-doc.md @@ -49,12 +49,12 @@ With the above commands, you should be able to 
replicate the following results: MAP | BM25 (Default)| :---------------------------------------|-----------| -[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0.2886 | +[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0,2886 | R@1000 | BM25 (Default)| :---------------------------------------|-----------| -[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0.9259 | +[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0,9259 | See [this page](https://github.com/castorini/docTTTTTquery#Replicating-MS-MARCO-Document-Ranking-Results-with-Anserini) for more details. Note that here we are using `trec_eval` to evaluate the top 1000 hits for each query; beware, the runs provided by MS MARCO organizers for reranking have only 100 hits per query. diff --git a/docs/regressions-msmarco-doc-docTTTTTquery-per-passage.md b/docs/regressions-msmarco-doc-docTTTTTquery-per-passage.md index 34f155cafa..d344feae4f 100644 --- a/docs/regressions-msmarco-doc-docTTTTTquery-per-passage.md +++ b/docs/regressions-msmarco-doc-docTTTTTquery-per-passage.md @@ -49,12 +49,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| :---------------------------------------|-----------| -[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0.3182 | +[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0,3182 | R@1000 | BM25 (Default)| :---------------------------------------|-----------| -[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0.9490 | +[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0,9490 | See [this page](https://github.com/castorini/docTTTTTquery#Replicating-MS-MARCO-Document-Ranking-Results-with-Anserini) for more details. Note that here we are using `trec_eval` to evaluate the top 1000 hits for each query; beware, the runs provided by MS MARCO organizers for reranking have only 100 hits per query. 
diff --git a/docs/regressions-msmarco-doc.md b/docs/regressions-msmarco-doc.md index 209ab4bf9e..cc608dd03b 100644 --- a/docs/regressions-msmarco-doc.md +++ b/docs/regressions-msmarco-doc.md @@ -98,12 +98,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0.2310 | 0.1632 | 0.1147 | 0.1357 | 0.2788 | 0.2289 | 0.1895 | 0.1559 | +[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0,2310 | 0,1632 | 0,1147 | 0,1357 | 0,2788 | 0,2289 | 0,1895 | 0,1559 | R@1000 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0.8856 | 0.8785 | 0.8369 | 0.8471 | 0.9326 | 0.9320 | 0.9264 | 0.8758 | +[MS MARCO Document Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Document-Ranking)| 0,8856 | 0,8785 | 0,8369 | 0,8471 | 0,9326 | 0,9320 | 0,9264 | 0,8758 | The setting "default" refers the default BM25 settings of `k1=0.9`, `b=0.4`, while "tuned" refers to the tuned setting of `k1=3.44`, `b=0.87`. See [this page](experiments-msmarco-doc.md) for more details. diff --git a/docs/regressions-msmarco-passage-doc2query.md b/docs/regressions-msmarco-passage-doc2query.md index a56436eb58..c9253d7c73 100644 --- a/docs/regressions-msmarco-passage-doc2query.md +++ b/docs/regressions-msmarco-passage-doc2query.md @@ -74,12 +74,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| +RM3 | BM25 (Tuned)| +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0.2270 | 0.2028 | 0.2293 | 0.2077 | +[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0,2270 | 0,2028 | 0,2293 | 0,2077 | R@1000 | BM25 (Default)| +RM3 | BM25 (Tuned)| +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0.8900 | 0.8916 | 0.8911 | 0.8957 | +[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0,8900 | 0,8916 | 0,8911 | 0,8957 | The setting "default" refers the default BM25 settings of `k1=0.9`, `b=0.4`, while "tuned" refers to the tuned setting of `k1=0.82`, `b=0.72` _on the original passages_. See [this page](experiments-msmarco-passage.md) for more details. 
diff --git a/docs/regressions-msmarco-passage-docTTTTTquery.md b/docs/regressions-msmarco-passage-docTTTTTquery.md index 74a90e05e0..2770c0ce8e 100644 --- a/docs/regressions-msmarco-passage-docTTTTTquery.md +++ b/docs/regressions-msmarco-passage-docTTTTTquery.md @@ -70,12 +70,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| +RM3 | BM25 (Tuned)| +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0.2805 | 0.2243 | 0.2850 | 0.2266 | +[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0,2805 | 0,2243 | 0,2850 | 0,2266 | R@1000 | BM25 (Default)| +RM3 | BM25 (Tuned)| +RM3 | :---------------------------------------|-----------|-----------|-----------|-----------| -[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0.9470 | 0.9463 | 0.9471 | 0.9479 | +[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0,9470 | 0,9463 | 0,9471 | 0,9479 | The setting "default" refers the default BM25 settings of `k1=0.9`, `b=0.4`, while "tuned" refers to the tuned setting of `k1=0.82`, `b=0.72` _on the original passages_. See [this page](experiments-msmarco-passage.md) for more details. diff --git a/docs/regressions-msmarco-passage.md b/docs/regressions-msmarco-passage.md index d9b50fe960..ef04d5d4c8 100644 --- a/docs/regressions-msmarco-passage.md +++ b/docs/regressions-msmarco-passage.md @@ -99,12 +99,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0.1926 | 0.1661 | 0.1625 | 0.1520 | 0.1958 | 0.1762 | 0.1699 | 0.1582 | +[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0,1926 | 0,1661 | 0,1625 | 0,1520 | 0,1958 | 0,1762 | 0,1699 | 0,1582 | R@1000 | BM25 (Default)| +RM3 | +Ax | +PRF | BM25 (Tuned)| +RM3 | +Ax | +PRF | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------|-----------|-----------| -[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0.8526 | 0.8606 | 0.8747 | 0.8537 | 0.8573 | 0.8687 | 0.8809 | 0.8561 | +[MS MARCO Passage Ranking: Dev Queries](https://github.com/microsoft/MSMARCO-Passage-Ranking)| 0,8526 | 0,8606 | 0,8747 | 0,8537 | 0,8573 | 0,8687 | 0,8809 | 0,8561 | The setting "default" refers the default BM25 settings of `k1=0.9`, `b=0.4`, while "tuned" refers to the tuned setting of `k1=0.82`, `b=0.68`. See [this page](experiments-msmarco-passage.md) for more details. 
diff --git a/docs/regressions-ntcir8-zh.md b/docs/regressions-ntcir8-zh.md index 33fd3b0fc1..0984b4eb60 100644 --- a/docs/regressions-ntcir8-zh.md +++ b/docs/regressions-ntcir8-zh.md @@ -54,14 +54,14 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | :---------------------------------------|-----------| -[NTCIR-8 ACLIA (IR4QA subtask, Monolingual Chinese)](../src/main/resources/topics-and-qrels/topics.ntcir8zh.eval.txt)| 0.4014 | +[NTCIR-8 ACLIA (IR4QA subtask, Monolingual Chinese)](../src/main/resources/topics-and-qrels/topics.ntcir8zh.eval.txt)| 0.4014 | P20 | BM25 | :---------------------------------------|-----------| -[NTCIR-8 ACLIA (IR4QA subtask, Monolingual Chinese)](../src/main/resources/topics-and-qrels/topics.ntcir8zh.eval.txt)| 0.3849 | +[NTCIR-8 ACLIA (IR4QA subtask, Monolingual Chinese)](../src/main/resources/topics-and-qrels/topics.ntcir8zh.eval.txt)| 0.3849 | NDCG20 | BM25 | :---------------------------------------|-----------| -[NTCIR-8 ACLIA (IR4QA subtask, Monolingual Chinese)](../src/main/resources/topics-and-qrels/topics.ntcir8zh.eval.txt)| 0.4757 | +[NTCIR-8 ACLIA (IR4QA subtask, Monolingual Chinese)](../src/main/resources/topics-and-qrels/topics.ntcir8zh.eval.txt)| 0.4757 | diff --git a/docs/regressions-robust04.md b/docs/regressions-robust04.md index 812082c142..b98a42a07e 100644 --- a/docs/regressions-robust04.md +++ b/docs/regressions-robust04.md @@ -85,12 +85,12 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2004 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust04.txt)| 0.2531 | 0.2903 | 0.2896 | 0.2467 | 0.2747 | 0.2774 | +[TREC 2004 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust04.txt)| 0.2531 | 0.2903 | 0.2896 | 0.2467 | 0.2747 | 0.2774 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2004 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust04.txt)| 0.3102 | 0.3365 | 0.3333 | 0.3079 | 0.3232 | 0.3229 | +[TREC 2004 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust04.txt)| 0.3102 | 0.3365 | 0.3333 | 0.3079 | 0.3232 | 0.3229 | ## Replication Log diff --git a/docs/regressions-robust05.md b/docs/regressions-robust05.md index 35db301446..8ec389abd5 100644 --- a/docs/regressions-robust05.md +++ b/docs/regressions-robust05.md @@ -84,9 +84,9 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2005 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust05.txt)| 0.2032 | 0.2602 | 0.2587 | 0.2028 | 0.2491 | 0.2476 | +[TREC 2005 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust05.txt)| 0.2032 | 0.2602 | 0.2587 | 0.2028 | 0.2491 | 0.2476 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[TREC 2005 Robust Track Topics](../src/main/resources/topics-and-qrels/topics.robust05.txt)| 0.3693 | 0.4187 | 0.4120 | 0.3653 | 0.4067 | 0.4113 | +[TREC 2005 Robust Track 
Topics](../src/main/resources/topics-and-qrels/topics.robust05.txt)| 0.3693 | 0.4187 | 0.4120 | 0.3653 | 0.4067 | 0.4113 | diff --git a/docs/regressions-trec02-ar.md b/docs/regressions-trec02-ar.md index 8cfb84b0b6..9786e6520f 100644 --- a/docs/regressions-trec02-ar.md +++ b/docs/regressions-trec02-ar.md @@ -54,14 +54,14 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | :---------------------------------------|-----------| -[TREC 2002 (Monolingual Arabic)](../src/main/resources/topics-and-qrels/topics.trec02ar-ar.txt)| 0.2932 | +[TREC 2002 (Monolingual Arabic)](../src/main/resources/topics-and-qrels/topics.trec02ar-ar.txt)| 0.2932 | P20 | BM25 | :---------------------------------------|-----------| -[TREC 2002 (Monolingual Arabic)](../src/main/resources/topics-and-qrels/topics.trec02ar-ar.txt)| 0.3610 | +[TREC 2002 (Monolingual Arabic)](../src/main/resources/topics-and-qrels/topics.trec02ar-ar.txt)| 0.3610 | NDCG20 | BM25 | :---------------------------------------|-----------| -[TREC 2002 (Monolingual Arabic)](../src/main/resources/topics-and-qrels/topics.trec02ar-ar.txt)| 0.4056 | +[TREC 2002 (Monolingual Arabic)](../src/main/resources/topics-and-qrels/topics.trec02ar-ar.txt)| 0.4056 | diff --git a/docs/regressions-wt10g.md b/docs/regressions-wt10g.md index 2c17cf18cc..3f86d62d49 100644 --- a/docs/regressions-wt10g.md +++ b/docs/regressions-wt10g.md @@ -84,9 +84,9 @@ With the above commands, you should be able to replicate the following results: MAP | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[Wt10g (Topics 451-550)](../src/main/resources/topics-and-qrels/topics.adhoc.451-550.txt)| 0.1992 | 0.2276 | 0.2200 | 0.2021 | 0.2188 | 0.2275 | +[Wt10g (Topics 451-550)](../src/main/resources/topics-and-qrels/topics.adhoc.451-550.txt)| 0.1992 | 0.2276 | 0.2200 | 0.2021 | 0.2188 | 0.2275 | P30 | BM25 | +RM3 | +Ax | QL | +RM3 | +Ax | :---------------------------------------|-----------|-----------|-----------|-----------|-----------|-----------| -[Wt10g (Topics 451-550)](../src/main/resources/topics-and-qrels/topics.adhoc.451-550.txt)| 0.2214 | 0.2398 | 0.2483 | 0.2180 | 0.2310 | 0.2514 | +[Wt10g (Topics 451-550)](../src/main/resources/topics-and-qrels/topics.adhoc.451-550.txt)| 0.2214 | 0.2398 | 0.2483 | 0.2180 | 0.2310 | 0.2514 | From 6e09bfba6bcbe17ce4689e9e891da470c213e075 Mon Sep 17 00:00:00 2001 From: tteofili Date: Mon, 25 Jan 2021 08:40:08 +0100 Subject: [PATCH 03/13] avoid loading vectors in a map --- .../java/io/anserini/ann/IndexVectors.java | 24 ++++++++++++++----- 1 file changed, 18 insertions(+), 6 deletions(-) diff --git a/src/main/java/io/anserini/ann/IndexVectors.java b/src/main/java/io/anserini/ann/IndexVectors.java index e46b6a4177..449910aac9 100644 --- a/src/main/java/io/anserini/ann/IndexVectors.java +++ b/src/main/java/io/anserini/ann/IndexVectors.java @@ -118,8 +118,6 @@ public static void main(String[] args) throws Exception { final long start = System.nanoTime(); System.out.println(String.format("Loading model %s", indexArgs.input)); - Map<String, List<float[]>> vectors = readGloVe(indexArgs.input); - Path indexDir = indexArgs.path; if (!Files.exists(indexDir)) { Files.createDirectories(indexDir); @@ -136,10 +134,23 @@ public static void main(String[] args) throws Exception { IndexWriter indexWriter = new IndexWriter(d, conf); final AtomicInteger cnt = new AtomicInteger(); - for (Map.Entry<String, List<float[]>> entry : vectors.entrySet()) { - for (float[] vector: 
entry.getValue()) { + for (String line : IOUtils.readLines(new FileReader(indexArgs.input))) { + String[] s = line.split("\\s+"); + if (s.length > 2) { + String key = s[0]; + float[] vector = new float[s.length - 1]; + float norm = 0f; + for (int i = 1; i < s.length; i++) { + float f = Float.parseFloat(s[i]); + vector[i - 1] = f; + norm += Math.pow(f, 2); + } + norm = (float) Math.sqrt(norm); + for (int i = 0; i < vector.length; i++) { + vector[i] = vector[i] / norm; + } Document doc = new Document(); - doc.add(new StringField(FIELD_ID, entry.getKey(), Field.Store.YES)); + doc.add(new StringField(FIELD_ID, key, Field.Store.YES)); StringBuilder sb = new StringBuilder(); for (double fv : vector) { if (sb.length() > 0) { @@ -151,8 +162,9 @@ public static void main(String[] args) throws Exception { try { indexWriter.addDocument(doc); int cur = cnt.incrementAndGet(); - if (cur % 100000 == 0) { + if (cur % 50000 == 0) { System.out.println(String.format("%s docs added", cnt)); + indexWriter.commit(); } } catch (IOException e) { System.err.println("Error while indexing: " + e.getLocalizedMessage()); From a914ee362180d19cd269b686adbfcd70e3ae5515 Mon Sep 17 00:00:00 2001 From: Tommaso Teofili Date: Thu, 19 May 2022 12:11:59 +0200 Subject: [PATCH 04/13] upgrade lucene and solr to 9.0 versions --- pom.xml | 63 +++++++++++++++++-- .../io/anserini/index/IndexCollection.java | 4 +- .../generator/AclAnthologyGenerator.java | 4 +- .../index/generator/BibtexGenerator.java | 4 +- .../index/generator/Cord19Generator.java | 4 +- .../index/generator/CoreGenerator.java | 6 +- .../DefaultLuceneDocumentGenerator.java | 4 +- .../index/generator/EpidemicQAGenerator.java | 4 +- .../io/anserini/rerank/ScoredDocuments.java | 6 +- .../java/io/anserini/search/SearchSolr.java | 4 +- .../search/query/SdmQueryGenerator.java | 6 +- .../solr/anserini/conf/solrconfig.xml | 30 ++------- .../java/io/anserini/IndexerTestBase.java | 10 +-- .../IndexerWithEmptyDocumentTestBase.java | 12 ++-- .../io/anserini/index/CloneIndexTest.java | 10 --- .../integration/CoreEndToEndTest.java | 2 +- .../io/anserini/integration/EndToEndTest.java | 2 +- .../integration/solr/SolrEndToEndTest.java | 6 +- .../DisjunctionMaxQueryGeneratorTest.java | 4 +- .../anserini/search/query/SdmQueryTest.java | 6 +- 20 files changed, 108 insertions(+), 83 deletions(-) diff --git a/pom.xml b/pom.xml index 3709a6dc1b..98ec3c12eb 100644 --- a/pom.xml +++ b/pom.xml @@ -26,7 +26,8 @@ - <lucene.version>8.11.0</lucene.version> + <lucene.version>9.0.0</lucene.version> + <solr.version>9.0.0</solr.version> <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding> @@ -297,7 +298,12 @@ <groupId>org.apache.lucene</groupId> - <artifactId>lucene-analyzers-kuromoji</artifactId> + <artifactId>lucene-queries</artifactId> + <version>${lucene.version}</version> + </dependency> + <dependency> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-analysis-kuromoji</artifactId> <version>${lucene.version}</version> @@ -315,13 +321,62 @@ <groupId>org.apache.solr</groupId> <artifactId>solr-solrj</artifactId> - <version>${lucene.version}</version> + <version>${solr.version}</version> + <exclusions> + <exclusion> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-core</artifactId> + </exclusion> + <exclusion> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-analysis-common</artifactId> + </exclusion> + <exclusion> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-queries</artifactId> + </exclusion> + <exclusion> + <groupId>org.slf4j</groupId> + <artifactId>slf4j-api</artifactId> + </exclusion> + <exclusion> + <groupId>org.apache.logging.log4j</groupId> + <artifactId>log4j-slf4j-impl</artifactId> + </exclusion> + </exclusions> </dependency> <dependency> <groupId>org.apache.solr</groupId> <artifactId>solr-test-framework</artifactId> - <version>${lucene.version}</version> + <version>${solr.version}</version> <scope>test</scope> + <exclusions> + <exclusion> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-core</artifactId> + </exclusion> + <exclusion> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-analysis-common</artifactId> + </exclusion> + <exclusion> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-queries</artifactId> + </exclusion> + <exclusion> + <groupId>org.slf4j</groupId> + <artifactId>slf4j-api</artifactId> + </exclusion> + <exclusion> + <groupId>org.apache.logging.log4j</groupId> + <artifactId>log4j-slf4j-impl</artifactId> + </exclusion> + </exclusions> + </dependency> + <dependency> + <groupId>org.apache.lucene</groupId> + <artifactId>lucene-codecs</artifactId> + <version>${lucene.version}</version> + </dependency> <dependency> <groupId>org.elasticsearch.client</groupId> diff --git a/src/main/java/io/anserini/index/IndexCollection.java b/src/main/java/io/anserini/index/IndexCollection.java index ed13692d7f..76ae835577 100644 --- a/src/main/java/io/anserini/index/IndexCollection.java +++ 
b/src/main/java/io/anserini/index/IndexCollection.java @@ -408,8 +408,8 @@ private class SolrClientFactory extends BasePooledObjectFactory { @Override public SolrClient create() { return new CloudSolrClient.Builder(Splitter.on(',').splitToList(args.zkUrl), Optional.of(args.zkChroot)) - .withConnectionTimeout(TIMEOUT) - .withSocketTimeout(TIMEOUT) +// .withConnectionTimeout(TIMEOUT) +// .withSocketTimeout(TIMEOUT) .build(); } diff --git a/src/main/java/io/anserini/index/generator/AclAnthologyGenerator.java b/src/main/java/io/anserini/index/generator/AclAnthologyGenerator.java index bdf6210ecf..c854ec00cb 100644 --- a/src/main/java/io/anserini/index/generator/AclAnthologyGenerator.java +++ b/src/main/java/io/anserini/index/generator/AclAnthologyGenerator.java @@ -23,11 +23,11 @@ import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.CharArraySet; import org.apache.lucene.analysis.TokenStream; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; import org.apache.lucene.document.IntPoint; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.document.StoredField; import org.apache.lucene.document.StringField; import org.apache.lucene.index.IndexOptions; @@ -102,7 +102,7 @@ public Document createDocument(AclAnthology.Document aclDoc) throws GeneratorExc // Store the collection docid. doc.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. - doc.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + doc.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); if (args.storeRaw) { doc.add(new StoredField(IndexArgs.RAW, aclDoc.raw())); diff --git a/src/main/java/io/anserini/index/generator/BibtexGenerator.java b/src/main/java/io/anserini/index/generator/BibtexGenerator.java index 23371b5834..14b2e1a64b 100644 --- a/src/main/java/io/anserini/index/generator/BibtexGenerator.java +++ b/src/main/java/io/anserini/index/generator/BibtexGenerator.java @@ -22,11 +22,11 @@ import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.CharArraySet; import org.apache.lucene.analysis.TokenStream; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; import org.apache.lucene.document.IntPoint; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.document.StoredField; import org.apache.lucene.document.StringField; import org.apache.lucene.index.IndexOptions; @@ -101,7 +101,7 @@ public Document createDocument(BibtexCollection.Document bibtexDoc) throws Gener // Store the collection docid. doc.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. 
- doc.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + doc.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); // Store the collection's bibtex type doc.add(new StringField(TYPE, type, Field.Store.YES)); diff --git a/src/main/java/io/anserini/index/generator/Cord19Generator.java b/src/main/java/io/anserini/index/generator/Cord19Generator.java index 7403425f3a..f9abccc20e 100644 --- a/src/main/java/io/anserini/index/generator/Cord19Generator.java +++ b/src/main/java/io/anserini/index/generator/Cord19Generator.java @@ -24,11 +24,11 @@ import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.CharArraySet; import org.apache.lucene.analysis.TokenStream; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; import org.apache.lucene.document.IntPoint; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.document.StoredField; import org.apache.lucene.document.StringField; import org.apache.lucene.index.IndexOptions; @@ -115,7 +115,7 @@ public Document createDocument(Cord19BaseDocument covidDoc) throws GeneratorExce // Store the collection docid. doc.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. - doc.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + doc.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); if (args.storeRaw) { doc.add(new StoredField(IndexArgs.RAW, raw)); diff --git a/src/main/java/io/anserini/index/generator/CoreGenerator.java b/src/main/java/io/anserini/index/generator/CoreGenerator.java index 1f9bf3316c..8ea1710d1f 100644 --- a/src/main/java/io/anserini/index/generator/CoreGenerator.java +++ b/src/main/java/io/anserini/index/generator/CoreGenerator.java @@ -23,11 +23,11 @@ import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.CharArraySet; import org.apache.lucene.analysis.TokenStream; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; import org.apache.lucene.document.IntPoint; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.document.StoredField; import org.apache.lucene.document.StringField; import org.apache.lucene.index.IndexOptions; @@ -106,7 +106,7 @@ public Document createDocument(CoreCollection.Document coreDoc) throws Generator // Store the collection docid. doc.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. 
- doc.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + doc.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); if (args.storeRaw) { doc.add(new StoredField(IndexArgs.RAW, coreDoc.raw())); @@ -165,10 +165,10 @@ private void addDocumentField(Document doc, String key, JsonNode value, FieldTyp // index as numeric value to allow range queries try { doc.add(new IntPoint(key, Integer.parseInt(valueText))); + doc.add(new StoredField(key, valueText)); } catch(Exception e) { // year is not numeric value } - doc.add(new StoredField(key, valueText)); } else { doc.add(new Field(key, valueText, fieldType)); } diff --git a/src/main/java/io/anserini/index/generator/DefaultLuceneDocumentGenerator.java b/src/main/java/io/anserini/index/generator/DefaultLuceneDocumentGenerator.java index bc226baa6b..b78962e5ae 100644 --- a/src/main/java/io/anserini/index/generator/DefaultLuceneDocumentGenerator.java +++ b/src/main/java/io/anserini/index/generator/DefaultLuceneDocumentGenerator.java @@ -21,10 +21,10 @@ import io.anserini.collection.SourceDocument; import io.anserini.index.IndexArgs; import org.apache.commons.lang3.ArrayUtils; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.document.StoredField; import org.apache.lucene.document.StringField; import org.apache.lucene.index.IndexOptions; @@ -74,7 +74,7 @@ public Document createDocument(T src) throws GeneratorException { // Store the collection docid. document.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. - document.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + document.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); if (args.storeRaw) { document.add(new StoredField(IndexArgs.RAW, src.raw())); diff --git a/src/main/java/io/anserini/index/generator/EpidemicQAGenerator.java b/src/main/java/io/anserini/index/generator/EpidemicQAGenerator.java index eb870adbdb..9a74406087 100644 --- a/src/main/java/io/anserini/index/generator/EpidemicQAGenerator.java +++ b/src/main/java/io/anserini/index/generator/EpidemicQAGenerator.java @@ -22,10 +22,10 @@ import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.CharArraySet; import org.apache.lucene.analysis.TokenStream; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.FieldType; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.document.StoredField; import org.apache.lucene.document.StringField; import org.apache.lucene.index.IndexOptions; @@ -76,7 +76,7 @@ public Document createDocument(EpidemicQACollection.Document covidDoc) throws Ge // Store the collection docid. doc.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. 
- doc.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + doc.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); if (args.storeRaw) { doc.add(new StoredField(IndexArgs.RAW, raw)); diff --git a/src/main/java/io/anserini/rerank/ScoredDocuments.java b/src/main/java/io/anserini/rerank/ScoredDocuments.java index cc41381254..c215927a31 100644 --- a/src/main/java/io/anserini/rerank/ScoredDocuments.java +++ b/src/main/java/io/anserini/rerank/ScoredDocuments.java @@ -17,12 +17,12 @@ package io.anserini.rerank; import io.anserini.index.IndexArgs; +import org.apache.lucene.document.BinaryDocValuesField; import org.apache.lucene.index.IndexReader; import org.apache.lucene.index.Term; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.StringField; -import org.apache.lucene.document.SortedDocValuesField; import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; @@ -97,7 +97,7 @@ public static ScoredDocuments fromSolrDocs(SolrDocumentList rs) { // Store the collection docid. document.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. - document.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + document.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); scoredDocs.documents[i] = document; scoredDocs.scores[i] = score; scoredDocs.ids[i] = i; // no internal Lucene ID available, use index as placeholder @@ -130,7 +130,7 @@ public static ScoredDocuments fromESDocs(SearchHits rs) { // Store the collection docid. document.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); // This is needed to break score ties by docid. - document.add(new SortedDocValuesField(IndexArgs.ID, new BytesRef(id))); + document.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); scoredDocs.documents[i] = document; scoredDocs.scores[i] = score; scoredDocs.ids[i] = i; // no internal Lucene ID available, use index as placeholder diff --git a/src/main/java/io/anserini/search/SearchSolr.java b/src/main/java/io/anserini/search/SearchSolr.java index cc83c92978..86b1a42f6b 100644 --- a/src/main/java/io/anserini/search/SearchSolr.java +++ b/src/main/java/io/anserini/search/SearchSolr.java @@ -165,8 +165,8 @@ public SearchSolr(Args args) throws IOException { LOG.info("Solr ZooKeeper URL: " + args.zkUrl); this.client = new CloudSolrClient.Builder(Splitter.on(',') .splitToList(args.zkUrl), Optional.of(args.zkChroot)) - .withConnectionTimeout(TIMEOUT) - .withSocketTimeout(TIMEOUT) +// .withConnectionTimeout(TIMEOUT) +// .withSocketTimeout(TIMEOUT) .build(); } diff --git a/src/main/java/io/anserini/search/query/SdmQueryGenerator.java b/src/main/java/io/anserini/search/query/SdmQueryGenerator.java index c99292594e..18dac1019d 100644 --- a/src/main/java/io/anserini/search/query/SdmQueryGenerator.java +++ b/src/main/java/io/anserini/search/query/SdmQueryGenerator.java @@ -19,14 +19,14 @@ import io.anserini.analysis.AnalyzerUtils; import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.index.Term; +import org.apache.lucene.queries.spans.SpanNearQuery; +import org.apache.lucene.queries.spans.SpanQuery; +import org.apache.lucene.queries.spans.SpanTermQuery; import org.apache.lucene.search.BooleanClause; import org.apache.lucene.search.BooleanQuery; import org.apache.lucene.search.BoostQuery; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; -import 
org.apache.lucene.search.spans.SpanNearQuery; -import org.apache.lucene.search.spans.SpanQuery; -import org.apache.lucene.search.spans.SpanTermQuery; import java.util.List; diff --git a/src/main/resources/solr/anserini/conf/solrconfig.xml b/src/main/resources/solr/anserini/conf/solrconfig.xml index 424d806e88..b00368515b 100644 --- a/src/main/resources/solr/anserini/conf/solrconfig.xml +++ b/src/main/resources/solr/anserini/conf/solrconfig.xml @@ -35,7 +35,7 @@ that you fully re-index after changing this setting as it can affect both how text is indexed and queried. --> - 8.0.0 + 9.0.0 - - - - - - - - - - - - @@ -422,8 +410,7 @@ maxRamMB - the maximum amount of RAM (in MB) that this cache is allowed to occupy --> - @@ -433,14 +420,12 @@ document). Since Lucene internal document ids are transient, this cache will not be autowarmed. --> - ${velocity.params.resource.loader.enabled:false} - - - 5 - - 8.0.0 + 9.0.0 - - - - - - - - - - - - - @@ -422,8 +409,7 @@ maxRamMB - the maximum amount of RAM (in MB) that this cache is allowed to occupy --> - @@ -433,14 +419,12 @@ document). Since Lucene internal document ids are transient, this cache will not be autowarmed. --> - ${velocity.solr.resource.loader.enabled:true} ${velocity.params.resource.loader.enabled:false} - - - - 5 - - + org.apache.lucene - lucene-analyzers-morfologik + lucene-analysis-morfologik ${lucene.version} diff --git a/src/main/java/io/anserini/index/IndexCollection.java b/src/main/java/io/anserini/index/IndexCollection.java index d4b9a9107d..e768f587fe 100644 --- a/src/main/java/io/anserini/index/IndexCollection.java +++ b/src/main/java/io/anserini/index/IndexCollection.java @@ -85,6 +85,7 @@ import org.apache.lucene.store.FSDirectory; import org.apache.solr.client.solrj.SolrClient; import org.apache.solr.client.solrj.impl.CloudSolrClient; +import org.apache.solr.client.solrj.impl.Http2SolrClient; import org.apache.solr.common.SolrInputDocument; import org.elasticsearch.action.DocWriteRequest; import org.elasticsearch.action.bulk.BulkRequest; @@ -411,8 +412,7 @@ private class SolrClientFactory extends BasePooledObjectFactory { @Override public SolrClient create() { return new CloudSolrClient.Builder(Splitter.on(',').splitToList(args.zkUrl), Optional.of(args.zkChroot)) -// .withConnectionTimeout(TIMEOUT) -// .withSocketTimeout(TIMEOUT) + .withInternalClientBuilder(new Http2SolrClient.Builder().connectionTimeout(TIMEOUT)) .build(); } diff --git a/src/main/java/io/anserini/search/SearchSolr.java b/src/main/java/io/anserini/search/SearchSolr.java index 86b1a42f6b..9b01661aa4 100644 --- a/src/main/java/io/anserini/search/SearchSolr.java +++ b/src/main/java/io/anserini/search/SearchSolr.java @@ -31,6 +31,7 @@ import org.apache.solr.client.solrj.SolrQuery; import org.apache.solr.client.solrj.SolrQuery.SortClause; import org.apache.solr.client.solrj.impl.CloudSolrClient; +import org.apache.solr.client.solrj.impl.Http2SolrClient; import org.apache.solr.client.solrj.response.QueryResponse; import org.apache.solr.common.SolrDocumentList; import org.kohsuke.args4j.CmdLineException; @@ -165,8 +166,7 @@ public SearchSolr(Args args) throws IOException { LOG.info("Solr ZooKeeper URL: " + args.zkUrl); this.client = new CloudSolrClient.Builder(Splitter.on(',') .splitToList(args.zkUrl), Optional.of(args.zkChroot)) -// .withConnectionTimeout(TIMEOUT) -// .withSocketTimeout(TIMEOUT) + .withInternalClientBuilder(new Http2SolrClient.Builder().connectionTimeout(TIMEOUT)) .build(); } diff --git 
a/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml b/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml index 092d84405e..5f3e4208ef 100644 --- a/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml +++ b/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml @@ -1287,7 +1287,7 @@ ${velocity.solr.resource.loader.enabled:true} ${velocity.params.resource.loader.enabled:false} - + org.apache.lucene lucene-analysis-morfologik @@ -328,77 +329,6 @@ 4.13.2 test - - org.apache.solr - solr-solrj - ${solr.version} - - - org.apache.lucene - lucene-core - - - org.apache.lucene - lucene-analysis-common - - - org.apache.lucene - lucene-queries - - - org.slf4j - slf4j-api - - - org.apache.logging.log4j - log4j-slf4j-impl - - - - - org.apache.solr - solr-test-framework - ${solr.version} - test - - - org.apache.lucene - lucene-core - - - org.apache.lucene - lucene-analysis-common - - - org.apache.lucene - lucene-queries - - - org.slf4j - slf4j-api - - - org.apache.logging.log4j - log4j-slf4j-impl - - - - - org.apache.lucene - lucene-codecs - ${lucene.version} - - - org.elasticsearch.client - elasticsearch-rest-high-level-client - 7.0.0 - - - org.apache.lucene - lucene-analyzers-common - - - org.tukaani xz @@ -502,6 +432,11 @@ commons-csv 1.8 + + org.apache.commons + commons-text + 1.9 + org.mockito mockito-all diff --git a/src/main/java/io/anserini/index/IndexArgs.java b/src/main/java/io/anserini/index/IndexArgs.java index 6997f95886..70957978da 100644 --- a/src/main/java/io/anserini/index/IndexArgs.java +++ b/src/main/java/io/anserini/index/IndexArgs.java @@ -69,8 +69,7 @@ public class IndexArgs { // optional arguments - @Option(name = "-index", metaVar = "[path]", forbids = {"-solr", "-es"}, - usage = "Index path.") + @Option(name = "-index", metaVar = "[path]", usage = "Index path.") public String index; @Option(name = "-fields", handler = StringArrayOptionHandler.class, @@ -160,82 +159,6 @@ public class IndexArgs { usage = "File that contains deleted tweet ids (longs), one per line; these tweets will be skipped during indexing.") public String tweetDeletedIdsFile = ""; - // Solr options - - @Option(name = "-solr", forbids = {"-index", "-es"}, - usage = "Indexes into Solr.") - public boolean solr = false; - - @Option(name = "-solr.batch", metaVar = "[n]", - usage = "Solr indexing batch size.") - public int solrBatch = 1000; - - @Option(name = "-solr.commitWithin", metaVar = "[s]", - usage = "Solr commitWithin setting (in seconds).") - public int solrCommitWithin = 60; - - @Option(name = "-solr.index", metaVar = "[name]", - usage = "Solr index name.") - public String solrIndex = null; - - @Option(name = "-solr.zkUrl", metaVar = "[urls]", - usage = "Solr ZooKeeper URLs (comma separated list).") - public String zkUrl = null; - - @Option(name = "-solr.zkChroot", metaVar = "[path]", - usage = "Solr ZooKeeper chroot") - public String zkChroot = "/"; - - @Option(name = "-solr.poolSize", metaVar = "[n]", - usage = "Solr client pool size.") - public int solrPoolSize = 16; - - // Elasticsearch options - - @Option(name = "-es", forbids = {"-index", "-solr"}, - usage = "Indexes into Elasticsearch.") - public boolean es = false; - - @Option(name = "-es.index", metaVar = "[name]", - usage = "Elasticsearch index name.") - public String esIndex = null; - - @Option(name = "-es.batch", metaVar = "[n]", - usage = "Elasticsearch batch index requests size.") - public int esBatch = 1000; - - @Option(name = "-es.bulk", metaVar = "[n]", - usage = "Elasticsearch max bulk requests size in 
bytes.") - public int esBulk = 80000000; - - @Option(name = "-es.hostname", metaVar = "[host]", - usage = "Elasticsearch host.") - public String esHostname = "localhost"; - - @Option(name = "-es.port", metaVar = "[port]", - usage = "Elasticsearch port number.") - public int esPort = 9200; - - @Option(name = "-es.user", metaVar = "[username]", - usage = "Elasticsearch user name.") - public String esUser = "elastic"; - - @Option(name = "-es.password", metaVar = "[password]", - usage = "Elasticsearch password.") - public String esPassword = "changeme"; - - @Option(name = "-es.poolSize", metaVar = "[num]", - usage = "Elasticsearch client pool size.") - public int esPoolSize = 10; - - @Option(name = "-es.connectTimeout", metaVar = "[ms]", - usage = "Elasticsearch (low level) REST client connect timeout (in ms).") - public int esConnectTimeout = TIMEOUT; - - @Option(name = "-es.socketTimeout", metaVar = "[ms]", - usage = "Elasticsearch (low level) REST client socket timeout (in ms).") - public int esSocketTimeout = TIMEOUT; - // Sharding options @Option(name = "-shard.count", metaVar = "[n]", diff --git a/src/main/java/io/anserini/index/IndexCollection.java b/src/main/java/io/anserini/index/IndexCollection.java index e768f587fe..b83403a3ae 100644 --- a/src/main/java/io/anserini/index/IndexCollection.java +++ b/src/main/java/io/anserini/index/IndexCollection.java @@ -16,8 +16,6 @@ package io.anserini.index; -import com.google.common.base.Splitter; -import com.google.common.collect.Lists; import io.anserini.analysis.DefaultEnglishAnalyzer; import io.anserini.analysis.TweetAnalyzer; import io.anserini.collection.DocumentCollection; @@ -27,22 +25,10 @@ import io.anserini.index.generator.InvalidDocumentException; import io.anserini.index.generator.LuceneDocumentGenerator; import io.anserini.index.generator.SkippedDocumentException; -import io.anserini.index.generator.WashingtonPostGenerator; import io.anserini.search.similarity.AccurateBM25Similarity; import io.anserini.search.similarity.ImpactSimilarity; import org.apache.commons.io.FileUtils; import org.apache.commons.lang3.time.DurationFormatUtils; -import org.apache.commons.pool2.BasePooledObjectFactory; -import org.apache.commons.pool2.ObjectPool; -import org.apache.commons.pool2.PooledObject; -import org.apache.commons.pool2.impl.DefaultPooledObject; -import org.apache.commons.pool2.impl.GenericObjectPool; -import org.apache.commons.pool2.impl.GenericObjectPoolConfig; -import org.apache.http.HttpHost; -import org.apache.http.auth.AuthScope; -import org.apache.http.auth.UsernamePasswordCredentials; -import org.apache.http.client.CredentialsProvider; -import org.apache.http.impl.client.BasicCredentialsProvider; import org.apache.logging.log4j.Level; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; @@ -72,29 +58,14 @@ import org.apache.lucene.analysis.th.ThaiAnalyzer; import org.apache.lucene.analysis.tr.TurkishAnalyzer; import org.apache.lucene.analysis.uk.UkrainianMorfologikAnalyzer; - import org.apache.lucene.document.Document; import org.apache.lucene.index.ConcurrentMergeScheduler; -import org.apache.lucene.index.DocValuesType; import org.apache.lucene.index.IndexWriter; import org.apache.lucene.index.IndexWriterConfig; -import org.apache.lucene.index.IndexableField; import org.apache.lucene.index.Term; import org.apache.lucene.search.similarities.BM25Similarity; import org.apache.lucene.store.Directory; import org.apache.lucene.store.FSDirectory; -import org.apache.solr.client.solrj.SolrClient; -import 
org.apache.solr.client.solrj.impl.CloudSolrClient; -import org.apache.solr.client.solrj.impl.Http2SolrClient; -import org.apache.solr.common.SolrInputDocument; -import org.elasticsearch.action.DocWriteRequest; -import org.elasticsearch.action.bulk.BulkRequest; -import org.elasticsearch.action.index.IndexRequest; -import org.elasticsearch.client.RequestOptions; -import org.elasticsearch.client.RestClient; -import org.elasticsearch.client.RestHighLevelClient; -import org.elasticsearch.common.xcontent.XContentBuilder; -import org.elasticsearch.common.xcontent.XContentFactory; import org.kohsuke.args4j.CmdLineException; import org.kohsuke.args4j.CmdLineParser; import org.kohsuke.args4j.OptionHandlerFilter; @@ -105,32 +76,21 @@ import java.nio.file.Files; import java.nio.file.Path; import java.nio.file.Paths; -import java.util.ArrayList; import java.util.Arrays; -import java.util.Collections; import java.util.HashSet; import java.util.List; -import java.util.Optional; import java.util.Set; import java.util.concurrent.Executors; import java.util.concurrent.ThreadPoolExecutor; import java.util.concurrent.TimeUnit; import java.util.concurrent.atomic.AtomicLong; -import java.util.stream.Collectors; -import java.util.stream.Stream; public final class IndexCollection { private static final Logger LOG = LogManager.getLogger(IndexCollection.class); - private static final int TIMEOUT = 600 * 1000; // This is the default analyzer used, unless another stemming algorithm or language is specified. public static final Analyzer DEFAULT_ANALYZER = DefaultEnglishAnalyzer.newDefaultInstance(); - // When duplicates of these fields are attempted to be indexed in Solr, they are ignored. This allows some fields to be multi-valued, but not others. - // Stored vs. indexed vs. doc values vs. multi-valued vs. ... are controlled via config, rather than code, in Solr. - private static final List IGNORED_DUPLICATE_FIELDS = - Lists.newArrayList(WashingtonPostGenerator.WashingtonPostField.PUBLISHED_DATE.name); - public final class Counters { /** * Counter for successfully indexed documents. @@ -262,361 +222,6 @@ public void run() { } } - private final class SolrIndexerThread implements Runnable { - private final Path input; - private final DocumentCollection collection; - private final List buffer = new ArrayList<>(args.solrBatch); - private FileSegment fileSegment; - - private SolrIndexerThread(DocumentCollection collection, Path input) { - this.input = input; - this.collection = collection; - } - - @Override - @SuppressWarnings("unchecked") - public void run() { - try { - LuceneDocumentGenerator generator = (LuceneDocumentGenerator) - generatorClass.getDeclaredConstructor(IndexArgs.class).newInstance(args); - - // We keep track of two separate counts: the total count of documents in this file segment (cnt), - // and the number of documents in this current "batch" (batch). 
We update the global counter every - // 10k documents: this is so that we get intermediate updates, which is informative if a collection - // has only one file segment; see https://github.com/castorini/anserini/issues/683 - int cnt = 0; - int batch = 0; - - @SuppressWarnings("unchecked") - FileSegment segment = (FileSegment) collection.createFileSegment(input); - // in order to call close() and clean up resources in case of exception - this.fileSegment = segment; - - for (SourceDocument sourceDocument : segment) { - if (!sourceDocument.indexable()) { - counters.unindexable.incrementAndGet(); - continue; - } - - Document document; - try { - document = generator.createDocument(sourceDocument); - } catch (EmptyDocumentException e1) { - counters.empty.incrementAndGet(); - continue; - } catch (SkippedDocumentException e2) { - counters.skipped.incrementAndGet(); - continue; - } catch (InvalidDocumentException e3) { - counters.errors.incrementAndGet(); - continue; - } - - if (whitelistDocids != null && !whitelistDocids.contains(sourceDocument.id())) { - counters.skipped.incrementAndGet(); - continue; - } - - SolrInputDocument solrDocument = new SolrInputDocument(); - - // Copy all Lucene Document fields to Solr document - for (IndexableField field : document.getFields()) { - // Skip docValues fields - this is done via Solr config. - if (field.fieldType().docValuesType() != DocValuesType.NONE) { - continue; - } - // If the field is already in the doc, skip it. - // This fixes an issue with WaPo where published_date is in the Lucene doc as LongPoint and StoredField. Solr needs one copy, more fine-grained control in config. - if (solrDocument.containsKey(field.name()) && IGNORED_DUPLICATE_FIELDS.contains(field.name())) { - continue; - } - if (field.numericValue() != null) { - solrDocument.addField(field.name(), field.numericValue()); - } else if (field.stringValue() != null) { // For some reason, id is multi-valued with null as one of the values - solrDocument.addField(field.name(), field.stringValue()); - } - } - - buffer.add(solrDocument); - if (buffer.size() == args.solrBatch) { - flush(); - } - - cnt++; - batch++; - - // And the counts from this batch, reset batch counter. - if (batch % 10000 == 0) { - counters.indexed.addAndGet(batch); - batch = 0; - } - } - - // If we have docs in the buffer, flush them. - if (!buffer.isEmpty()) { - flush(); - } - - // Add the remaining documents. - counters.indexed.addAndGet(batch); - - int skipped = segment.getSkippedCount(); - if (skipped > 0) { - // When indexing tweets, this is normal, because there are delete messages that are skipped over. - counters.skipped.addAndGet(skipped); - LOG.warn(input.getParent().getFileName().toString() + File.separator + - input.getFileName().toString() + ": " + skipped + " docs skipped."); - } - - if (segment.getErrorStatus()) { - counters.errors.incrementAndGet(); - LOG.error(input.getParent().getFileName().toString() + File.separator + - input.getFileName().toString() + ": error iterating through segment."); - } - - // Log at the debug level because this can be quite noisy if there are lots of file segments. 
- LOG.debug(input.getParent().getFileName().toString() + File.separator + - input.getFileName().toString() + ": " + cnt + " docs added."); - } catch (Exception e) { - LOG.error(Thread.currentThread().getName() + ": Unexpected Exception:", e); - } finally { - if (fileSegment != null) { - fileSegment.close(); - } - } - } - - private void flush() { - if (!buffer.isEmpty()) { - SolrClient solrClient = null; - try { - solrClient = solrPool.borrowObject(); - solrClient.add(args.solrIndex, buffer, args.solrCommitWithin * 1000); - buffer.clear(); - } catch (Exception e) { - LOG.error("Error flushing documents to Solr", e); - } finally { - if (solrClient != null) { - try { - solrPool.returnObject(solrClient); - } catch (Exception e) { - LOG.error("Error returning SolrClient to pool", e); - } - } - } - } - } - } - - private class SolrClientFactory extends BasePooledObjectFactory { - @Override - public SolrClient create() { - return new CloudSolrClient.Builder(Splitter.on(',').splitToList(args.zkUrl), Optional.of(args.zkChroot)) - .withInternalClientBuilder(new Http2SolrClient.Builder().connectionTimeout(TIMEOUT)) - .build(); - } - - @Override - public PooledObject wrap(SolrClient solrClient) { - return new DefaultPooledObject<>(solrClient); - } - - @Override - public void destroyObject(PooledObject pooled) throws Exception { - pooled.getObject().close(); - } - } - - private final class ESIndexerThread implements Runnable { - private final Path input; - private final DocumentCollection collection; - private BulkRequest bulkRequest; - private FileSegment fileSegment; - - private ESIndexerThread(DocumentCollection collection, Path input) { - this.input = input; - this.collection = collection; - this.bulkRequest = new BulkRequest(); - } - - @Override - @SuppressWarnings("unchecked") - public void run() { - try { - LuceneDocumentGenerator generator = (LuceneDocumentGenerator) - generatorClass.getDeclaredConstructor(IndexArgs.class).newInstance(args); - - // We keep track of two separate counts: the total count of documents in this file segment (cnt), - // and the number of documents in this current "batch" (batch). 
We update the global counter every - // 10k documents: this is so that we get intermediate updates, which is informative if a collection - // has only one file segment; see https://github.com/castorini/anserini/issues/683 - int cnt = 0; - int batch = 0; - - FileSegment segment = collection.createFileSegment(input); - // in order to call close() and clean up resources in case of exception - this.fileSegment = segment; - - for (SourceDocument sourceDocument : segment) { - if (!sourceDocument.indexable()) { - counters.unindexable.incrementAndGet(); - continue; - } - - Document document; - try { - document = generator.createDocument(sourceDocument); - } catch (EmptyDocumentException e1) { - counters.empty.incrementAndGet(); - continue; - } catch (SkippedDocumentException e2) { - counters.skipped.incrementAndGet(); - continue; - } catch (InvalidDocumentException e3) { - counters.errors.incrementAndGet(); - continue; - } - - if (whitelistDocids != null && !whitelistDocids.contains(sourceDocument.id())) { - counters.skipped.incrementAndGet(); - continue; - } - - // Get distinct field names - List fields = document.getFields().stream().map(field -> field.name()).distinct().collect(Collectors.toList()); - - XContentBuilder builder = XContentFactory.jsonBuilder().startObject(); - - for (String field : fields) { - - // Skip docValues fields - if (document.getField(field).fieldType().docValuesType() != DocValuesType.NONE) continue; - - // Get field objects for current field name (could be multiple, such as WaPo's fullCaption) - IndexableField[] indexableFields = document.getFields(field); - - if (field.equalsIgnoreCase("id") || indexableFields.length == 1) { - // Single value fields or "id" field - Object value = document.getField(field).stringValue() != null ? document.getField(field).stringValue() : document.getField(field).numericValue(); - builder.field(field, value); - } else { - // Multi-valued fields - Object[] values = Stream.of(indexableFields).map(f -> f.stringValue()).toArray(); - builder.array(field, values); - } - } - - builder.endObject(); - - String indexName = (args.esIndex != null) ? args.esIndex : input.getFileName().toString(); - bulkRequest.add(new IndexRequest(indexName).id(sourceDocument.id()).source(builder)); - - // sendBulkRequest when the batch size is reached OR the bulk size is reached - if (bulkRequest.numberOfActions() == args.esBatch || - bulkRequest.estimatedSizeInBytes() >= args.esBulk) { - sendBulkRequest(); - } - - cnt++; - batch++; - - // And the counts from this batch, reset batch counter. - if (batch % 10000 == 0) { - counters.indexed.addAndGet(batch); - batch = 0; - } - } - - if (bulkRequest.numberOfActions() != 0) { - sendBulkRequest(); - } - - // Add the remaining documents. - counters.indexed.addAndGet(batch); - - int skipped = segment.getSkippedCount(); - if (skipped > 0) { - // When indexing tweets, this is normal, because there are delete messages that are skipped over. - counters.skipped.addAndGet(skipped); - LOG.warn(input.getParent().getFileName().toString() + File.separator + - input.getFileName().toString() + ": " + skipped + " docs skipped."); - } - - if (segment.getErrorStatus()) { - counters.errors.incrementAndGet(); - LOG.error(input.getParent().getFileName().toString() + File.separator + - input.getFileName().toString() + ": error iterating through segment."); - } - - // Log at the debug level because this can be quite noisy if there are lots of file segments. 
- LOG.debug(input.getParent().getFileName().toString() + File.separator + - input.getFileName().toString() + ": " + cnt + " docs added."); - } catch (Exception e) { - LOG.error(Thread.currentThread().getName() + ": Unexpected Exception:", e); - } finally { - if (fileSegment != null){ - fileSegment.close(); - } - } - } - - private void sendBulkRequest() { - if (bulkRequest.numberOfActions() == 0) { - return; - } - - RestHighLevelClient esClient = null; - try { - esClient = esPool.borrowObject(); - esClient.bulk(bulkRequest, RequestOptions.DEFAULT); - bulkRequest = new BulkRequest(); - } catch (Exception e) { - LOG.error("Error sending bulk requests to Elasticsearch", e); - - // Log the 10 docs that have the largest sizes in this request - List> docs = bulkRequest.requests(); - Collections.sort(docs, (d1, d2) -> ((IndexRequest) d2).source().length() - ((IndexRequest) d1).source().length()); - - LOG.info("Error sending bulkRequest. The 10 largest docs in this request are the following cord_uid: "); - for (int i = 0; i < 10; i++) { - IndexRequest doc = (IndexRequest) docs.get(i); - LOG.info(doc.id()); - } - } finally { - if (esClient != null) { - try { - esPool.returnObject(esClient); - } catch (Exception e) { - LOG.error("Error returning ES client to pool", e); - } - } - } - } - } - - private class ESClientFactory extends BasePooledObjectFactory { - @Override - public RestHighLevelClient create() { - final CredentialsProvider credentialsProvider = new BasicCredentialsProvider(); - credentialsProvider.setCredentials(AuthScope.ANY, new UsernamePasswordCredentials(args.esUser, args.esPassword)); - return new RestHighLevelClient( - RestClient.builder(new HttpHost(args.esHostname, args.esPort, "http")) - .setHttpClientConfigCallback(builder -> builder.setDefaultCredentialsProvider(credentialsProvider)) - .setRequestConfigCallback(builder -> builder.setConnectTimeout(args.esConnectTimeout).setSocketTimeout(args.esSocketTimeout)) - ); - } - - @Override - public PooledObject wrap(RestHighLevelClient esClient) { - return new DefaultPooledObject<>(esClient); - } - - @Override - public void destroyObject(PooledObject pooled) throws Exception { - pooled.getObject().close(); - } - } - private final IndexArgs args; private final Path collectionPath; private final Set whitelistDocids; @@ -625,10 +230,6 @@ public void destroyObject(PooledObject pooled) throws Excep private final DocumentCollection collection; private final Counters counters; private Path indexPath; - private ObjectPool solrPool; - private ObjectPool esPool; - - @SuppressWarnings("unchecked") public IndexCollection(IndexArgs args) throws Exception { @@ -665,32 +266,7 @@ public IndexCollection(IndexArgs args) throws Exception { LOG.info("Optimize (merge segments)? 
" + args.optimize); LOG.info("Whitelist: " + args.whitelist); LOG.info("Pretokenized?: " + args.pretokenized); - - if (args.solr) { - LOG.info("Indexing into Solr..."); - LOG.info("Solr batch size: " + args.solrBatch); - LOG.info("Solr commitWithin: " + args.solrCommitWithin); - LOG.info("Solr index: " + args.solrIndex); - LOG.info("Solr ZooKeeper URL: " + args.zkUrl); - LOG.info("SolrClient pool size: " + args.solrPoolSize); - } else if (args.es) { - LOG.info("Indexing into Elasticsearch..."); - LOG.info("Elasticsearch batch size: " + args.esBatch); - LOG.info("Elasticsearch index: " + args.esIndex); - LOG.info("Elasticsearch hostname: " + args.esHostname); - LOG.info("Elasticsearch host port: " + args.esPort); - LOG.info("Elasticsearch client connect timeout (in ms): " + args.esConnectTimeout); - LOG.info("Elasticsearch client socket timeout (in ms): " + args.esSocketTimeout); - LOG.info("Elasticsearch pool size: " + args.esPoolSize); - LOG.info("Elasticsearch user: " + args.esUser); - } else { - LOG.info("Directly building Lucene indexes..."); - LOG.info("Index path: " + args.index); - } - - if (args.index == null && !args.solr && !args.es) { - throw new IllegalArgumentException("Must specify one of -index, -solr, or -es"); - } + LOG.info("Index path: " + args.index); if (args.index != null) { this.indexPath = Paths.get(args.index); @@ -723,18 +299,6 @@ public IndexCollection(IndexArgs args) throws Exception { this.whitelistDocids = null; } - if (args.solr) { - GenericObjectPoolConfig config = new GenericObjectPoolConfig<>(); - config.setMaxTotal(args.solrPoolSize); - config.setMinIdle(args.solrPoolSize); // To guard against premature discarding of solrClients - this.solrPool = new GenericObjectPool<>(new SolrClientFactory(), config); - } else if (args.es) { - GenericObjectPoolConfig config = new GenericObjectPoolConfig<>(); - config.setMaxTotal(args.esPoolSize); - config.setMinIdle(args.esPoolSize); - this.esPool = new GenericObjectPool<>(new ESClientFactory(), config); - } - this.counters = new Counters(); } @@ -865,13 +429,7 @@ public Counters run() throws IOException { LOG.info("Starting to index..."); for (int i = 0; i < segmentCnt; i++) { - if (args.solr) { - executor.execute(new SolrIndexerThread(collection, (Path) segmentPaths.get(i))); - } else if (args.es) { - executor.execute(new ESIndexerThread(collection, (Path) segmentPaths.get(i))); - } else { - executor.execute(new LocalIndexerThread(writer, collection, (Path) segmentPaths.get(i))); - } + executor.execute(new LocalIndexerThread(writer, collection, (Path) segmentPaths.get(i))); } executor.shutdown(); @@ -898,31 +456,9 @@ public Counters run() throws IOException { " is not equal to completedTaskCount = " + executor.getCompletedTaskCount()); } - long numIndexed; - - if (args.solr || args.es) { - numIndexed = counters.indexed.get(); - } else { - numIndexed = writer.getDocStats().maxDoc; - } + long numIndexed = writer.getDocStats().maxDoc; // Do a final commit - if (args.solr) { - try { - SolrClient client = solrPool.borrowObject(); - client.commit(args.solrIndex); - // Needed for orderly shutdown so the SolrClient executor does not delay main thread exit - solrPool.returnObject(client); - solrPool.close(); - } catch (Exception e) { - LOG.error("Exception during final Solr commit: ", e); - } - } - - if (args.es) { - esPool.close(); - } - try { if (writer != null) { writer.commit(); diff --git a/src/main/java/io/anserini/rerank/ScoredDocuments.java b/src/main/java/io/anserini/rerank/ScoredDocuments.java index 
c215927a31..e4eb692873 100644 --- a/src/main/java/io/anserini/rerank/ScoredDocuments.java +++ b/src/main/java/io/anserini/rerank/ScoredDocuments.java @@ -17,30 +17,21 @@ package io.anserini.rerank; import io.anserini.index.IndexArgs; -import org.apache.lucene.document.BinaryDocValuesField; +import org.apache.commons.lang3.ArrayUtils; +import org.apache.logging.log4j.LogManager; +import org.apache.logging.log4j.Logger; +import org.apache.lucene.document.Document; import org.apache.lucene.index.IndexReader; import org.apache.lucene.index.Term; -import org.apache.lucene.document.Document; -import org.apache.lucene.document.Field; -import org.apache.lucene.document.StringField; import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; import org.apache.lucene.search.TopDocs; -import org.apache.lucene.util.BytesRef; -import org.apache.solr.common.SolrDocument; -import org.apache.solr.common.SolrDocumentList; -import org.apache.commons.lang3.ArrayUtils; -import org.apache.logging.log4j.LogManager; -import org.apache.logging.log4j.Logger; -import org.elasticsearch.search.SearchHit; -import org.elasticsearch.search.SearchHits; - -import java.util.List; +import java.io.IOException; import java.util.ArrayList; +import java.util.List; import java.util.Map; -import java.io.IOException; /** * ScoredDocuments object that converts TopDocs from the searcher into an Anserini format @@ -74,71 +65,6 @@ public static ScoredDocuments fromTopDocs(TopDocs rs, IndexSearcher searcher) { return scoredDocs; } - public static ScoredDocuments fromSolrDocs(SolrDocumentList rs) { - - ScoredDocuments scoredDocs = new ScoredDocuments(); - - int length = rs.size(); - scoredDocs.documents = new Document[length]; - scoredDocs.ids = new int[length]; - scoredDocs.scores = new float[length]; - - for (int i = 0; i < length; i++) { - - SolrDocument d = rs.get(i); - - // Create placeholder copies of Lucene Documents - // Intention is for compatibility with ScoreTiesAdjusterReranker without disturbing other aspects of reranker code - - Document document = new Document(); - String id = d.getFieldValue("id").toString(); - float score = (float) d.getFieldValue("score"); - - // Store the collection docid. - document.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); - // This is needed to break score ties by docid. - document.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); - scoredDocs.documents[i] = document; - scoredDocs.scores[i] = score; - scoredDocs.ids[i] = i; // no internal Lucene ID available, use index as placeholder - } - - return scoredDocs; - } - - public static ScoredDocuments fromESDocs(SearchHits rs) { - - ScoredDocuments scoredDocs = new ScoredDocuments(); - SearchHit[] searchHits = rs.getHits(); - - int length = searchHits.length; - scoredDocs.documents = new Document[length]; - scoredDocs.ids = new int[length]; - scoredDocs.scores = new float[length]; - - for (int i = 0; i < length; i++) { - - SearchHit hit = searchHits[i]; - - // Create placeholder copies of Lucene Documents - // Intention is for compatibility with ScoreTiesAdjusterReranker without disturbing other aspects of reranker code - - Document document = new Document(); - String id = hit.getId(); - float score = hit.getScore(); - - // Store the collection docid. - document.add(new StringField(IndexArgs.ID, id, Field.Store.YES)); - // This is needed to break score ties by docid. 
- document.add(new BinaryDocValuesField(IndexArgs.ID, new BytesRef(id))); - scoredDocs.documents[i] = document; - scoredDocs.scores[i] = score; - scoredDocs.ids[i] = i; // no internal Lucene ID available, use index as placeholder - } - - return scoredDocs; - } - public static ScoredDocuments fromQrels(Map qrels, IndexReader reader) throws IOException { ScoredDocuments scoredDocs = new ScoredDocuments(); diff --git a/src/main/java/io/anserini/search/SearchElastic.java b/src/main/java/io/anserini/search/SearchElastic.java deleted file mode 100644 index fdc01e387f..0000000000 --- a/src/main/java/io/anserini/search/SearchElastic.java +++ /dev/null @@ -1,334 +0,0 @@ -/* - * Anserini: A Lucene toolkit for reproducible information retrieval research - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ - -package io.anserini.search; - -import io.anserini.index.IndexArgs; -import io.anserini.index.generator.TweetGenerator; -import io.anserini.rerank.ScoredDocuments; -import io.anserini.rerank.lib.ScoreTiesAdjusterReranker; -import io.anserini.search.topicreader.TopicReader; -import org.apache.commons.lang3.time.DurationFormatUtils; -import org.apache.http.HttpHost; -import org.apache.http.auth.AuthScope; -import org.apache.http.auth.UsernamePasswordCredentials; -import org.apache.http.client.CredentialsProvider; -import org.apache.http.impl.client.BasicCredentialsProvider; -import org.apache.logging.log4j.LogManager; -import org.apache.logging.log4j.Logger; -import org.elasticsearch.action.search.SearchRequest; -import org.elasticsearch.action.search.SearchResponse; -import org.elasticsearch.client.HttpAsyncResponseConsumerFactory; -import org.elasticsearch.client.RequestOptions; -import org.elasticsearch.client.RestClient; -import org.elasticsearch.client.RestHighLevelClient; -import org.elasticsearch.index.query.BoolQueryBuilder; -import org.elasticsearch.index.query.QueryBuilders; -import org.elasticsearch.index.query.QueryStringQueryBuilder; -import org.elasticsearch.index.query.RangeQueryBuilder; -import org.elasticsearch.search.SearchHits; -import org.elasticsearch.search.builder.SearchSourceBuilder; -import org.elasticsearch.search.sort.FieldSortBuilder; -import org.elasticsearch.search.sort.ScoreSortBuilder; -import org.elasticsearch.search.sort.SortOrder; -import org.kohsuke.args4j.CmdLineException; -import org.kohsuke.args4j.CmdLineParser; -import org.kohsuke.args4j.Option; -import org.kohsuke.args4j.OptionHandlerFilter; -import org.kohsuke.args4j.ParserProperties; -import org.kohsuke.args4j.spi.StringArrayOptionHandler; - -import java.io.Closeable; -import java.io.IOException; -import java.io.PrintWriter; -import java.nio.charset.StandardCharsets; -import java.nio.file.Files; -import java.nio.file.Path; -import java.nio.file.Paths; -import java.util.Locale; -import java.util.Map; -import java.util.SortedMap; -import java.util.TreeMap; -import java.util.concurrent.TimeUnit; - -/* -* Entry point of the Retrieval. 
- */ -public final class SearchElastic implements Closeable { - - private static final Logger LOG = LogManager.getLogger(SearchCollection.class); - private static final int TIMEOUT = 600 * 1000; - private final Args args; - private RestHighLevelClient client; - - private static final RequestOptions COMMON_OPTIONS; - static { - RequestOptions.Builder builder = RequestOptions.DEFAULT.toBuilder(); - builder.setHttpAsyncResponseConsumerFactory( - new HttpAsyncResponseConsumerFactory.HeapBufferedResponseConsumerFactory(1024 * 1024 * 1024)); - COMMON_OPTIONS = builder.build(); - } - - public static final class Args { - - // required arguments - - @Option(name = "-topics", metaVar = "[file]", handler = StringArrayOptionHandler.class, required = true, usage = "topics file") - public String[] topics; - - @Option(name = "-output", metaVar = "[file]", required = true, usage = "output file") - public String output; - - @Option(name = "-topicreader", required = true, usage = "define how to read the topic(query) file: one of [Trec|Webxml]") - public String topicReader; - - @Option(name = "-es.index", usage = "the name of the index in Elasticsearch") - public String esIndex = null; - - @Option(name = "-es.hostname", usage = "the name of Elasticsearch HTTP host") - public String esHostname = "localhost"; - - @Option(name = "-es.port", usage = "the port for Elasticsearch HTTP host") - public int esPort = 9200; - - /** - * The user and password are defaulted to those pre-configured for docker-elk - */ - @Option(name = "-es.user", usage = "the user of the ELK stack") - public String esUser = "elastic"; - - @Option(name = "-es.password", usage = "the password for the ELK stack") - public String esPassword = "changeme"; - - // optional arguments - @Option(name = "-topicfield", usage = "Which field of the query should be used, default \"title\"." + - " For TREC ad hoc topics, description or narrative can be used.") - public String topicfield = "title"; - - @Option(name = "-searchtweets", usage = "Whether the search is against a tweet " + - "index created by IndexCollection -collection TweetCollection") - public Boolean searchtweets = false; - - @Option(name = "-hits", metaVar = "[number]", required = false, usage = "max number of hits to return") - public int hits = 1000; - - @Option(name = "-runtag", metaVar = "[tag]", required = false, usage = "runtag") - public String runtag = null; - - } - - private final class ESSearcherThread extends Thread { - - final private SortedMap> topics; - final private String outputPath; - final private String runTag; - - private ESSearcherThread(SortedMap> topics, String outputPath, String runTag){ - - this.topics = topics; - this.runTag = runTag; - this.outputPath = outputPath; - setName(outputPath); - } - - @Override - public void run() { - try { - LOG.info("[Start] Retrieval with Elasticsearch collection: " + args.esIndex); - final long start = System.nanoTime(); - PrintWriter out = new PrintWriter(Files.newBufferedWriter(Paths.get(outputPath), StandardCharsets.US_ASCII)); - - for (Map.Entry> entry : topics.entrySet()) { - K qid = entry.getKey(); - String queryString = entry.getValue().get(args.topicfield); - ScoredDocuments docs; - if (args.searchtweets) { - docs = searchTweets(queryString, Long.parseLong(entry.getValue().get("time"))); - } else { - docs = search(queryString); - } - - /** - * the first column is the topic number. - * the second column is currently unused and should always be "Q0". 
- * the third column is the official document identifier of the retrieved document. - * the fourth column is the rank the document is retrieved. - * the fifth column shows the score (integer or floating point) that generated the ranking. - * the sixth column is called the "run tag" and should be a unique identifier for your - */ - for (int i = 0; i < docs.documents.length; i++) { - out.println(String.format(Locale.US, "%s Q0 %s %d %f %s", qid, - docs.documents[i].getField(IndexArgs.ID).stringValue(), (i + 1), docs.scores[i], runTag)); - } - } - out.flush(); - out.close(); - - final long durationMillis = TimeUnit.MILLISECONDS.convert(System.nanoTime() - start, TimeUnit.NANOSECONDS); - LOG.info("[Finished] Run " + topics.size() + " topics searched in " - + DurationFormatUtils.formatDuration(durationMillis, "HH:mm:ss")); - } catch (Exception e) { - LOG.error(Thread.currentThread().getName() + ": Unexpected Exception:", e); - } - } - } - - public SearchElastic(Args args) { - this.args = args; - LOG.info("Elasticsearch index: " + args.esIndex); - LOG.info("Elasticsearch hostname: " + args.esHostname); - LOG.info("Elasticsearch host port: " + args.esPort); - - final CredentialsProvider credentialsProvider = new BasicCredentialsProvider(); - credentialsProvider.setCredentials(AuthScope.ANY, new UsernamePasswordCredentials(args.esUser, args.esPassword)); - - this.client = new RestHighLevelClient( - RestClient.builder(new HttpHost(args.esHostname, args.esPort, "http")) - .setHttpClientConfigCallback(builder -> builder.setDefaultCredentialsProvider(credentialsProvider)) - .setRequestConfigCallback(builder -> builder.setConnectTimeout(TIMEOUT).setSocketTimeout(TIMEOUT))); - } - - @SuppressWarnings("unchecked") - public void runTopics() throws IOException { - TopicReader tr; - SortedMap> topics = new TreeMap<>(); - for (String singleTopicsFile : args.topics) { - Path topicsFilePath = Paths.get(singleTopicsFile); - if (!Files.exists(topicsFilePath) || !Files.isRegularFile(topicsFilePath) || !Files.isReadable(topicsFilePath)) { - throw new IllegalArgumentException("Topics file : " + topicsFilePath + " does not exist or is not a (readable) file."); - } - try { - tr = (TopicReader) Class.forName("io.anserini.search.topicreader." + args.topicReader + "TopicReader") - .getConstructor(Path.class).newInstance(topicsFilePath); - topics.putAll(tr.read()); - } catch (Exception e) { - throw new IllegalArgumentException("Unable to load topic reader: " + args.topicReader); - } - } - - final String runTag = args.runtag == null ? 
"Elastirini" : args.runtag; - ESSearcherThread esThread = new ESSearcherThread(topics, args.output, runTag); - esThread.run(); - } - - public ScoredDocuments search(String queryString){ - - SearchHits results = null; - - String specials = "+-=&|> ScoredDocuments searchTweets(String queryString, long t){ - - SearchHits results = null; - - String specials = "+-=&|> tag contains the timestamp of the query in terms of the - // chronologically nearest tweet id within the corpus - RangeQueryBuilder queryTweetTime = QueryBuilders - .rangeQuery(TweetGenerator.TweetField.ID_LONG.name) - .from(0L) - .to(t); - - QueryStringQueryBuilder queryTerms = QueryBuilders - .queryStringQuery(queryString) - .defaultField("contents") - .analyzer("english"); - - BoolQueryBuilder query = QueryBuilders.boolQuery() - .filter(queryTweetTime) - .should(queryTerms); - - SearchRequest searchRequest = new SearchRequest(args.esIndex); - SearchSourceBuilder sourceBuilder = new SearchSourceBuilder(); - sourceBuilder.query(query); - sourceBuilder.size(args.hits); - sourceBuilder.sort(new ScoreSortBuilder().order(SortOrder.DESC)); - sourceBuilder.sort(new FieldSortBuilder(TweetGenerator.TweetField.ID_LONG.name).order(SortOrder.DESC)); - searchRequest.source(sourceBuilder); - - try { - SearchResponse searchResponse = client.search(searchRequest, COMMON_OPTIONS); - results = searchResponse.getHits(); - } catch (Exception e) { - LOG.error("Exception during ES query: ", e); - } - - ScoreTiesAdjusterReranker reranker = new ScoreTiesAdjusterReranker(); - return reranker.rerank(ScoredDocuments.fromESDocs(results), null); - } - - @Override - public void close() throws IOException { - client.close(); - } - - public static void main(String[] args) throws Exception { - Args searchElasticArgs = new Args(); - CmdLineParser parser = new CmdLineParser(searchElasticArgs, ParserProperties.defaults().withUsageWidth(90)); - - try { - parser.parseArgument(args); - } catch (CmdLineException e) { - System.err.println(e.getMessage()); - parser.printUsage(System.err); - System.err.println("Example: SearchElastic" + parser.printExample(OptionHandlerFilter.REQUIRED)); - return; - } - - final long start = System.nanoTime(); - SearchElastic searcher = new SearchElastic(searchElasticArgs); - searcher.runTopics(); - searcher.close(); - final long durationMillis = TimeUnit.MILLISECONDS.convert(System.nanoTime() - start, TimeUnit.NANOSECONDS); - LOG.info("Total run time: " + DurationFormatUtils.formatDuration(durationMillis, "HH:mm:ss")); - } -} \ No newline at end of file diff --git a/src/main/java/io/anserini/search/SearchSolr.java b/src/main/java/io/anserini/search/SearchSolr.java deleted file mode 100644 index 9b01661aa4..0000000000 --- a/src/main/java/io/anserini/search/SearchSolr.java +++ /dev/null @@ -1,275 +0,0 @@ -/* - * Anserini: A Lucene toolkit for reproducible information retrieval research - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. 
- */ - -package io.anserini.search; - -import com.google.common.base.Splitter; -import io.anserini.index.IndexArgs; -import io.anserini.index.generator.TweetGenerator; -import io.anserini.rerank.ScoredDocuments; -import io.anserini.rerank.lib.ScoreTiesAdjusterReranker; -import io.anserini.search.topicreader.TopicReader; -import org.apache.commons.lang3.time.DurationFormatUtils; -import org.apache.logging.log4j.LogManager; -import org.apache.logging.log4j.Logger; -import org.apache.lucene.document.LongPoint; -import org.apache.lucene.search.Query; -import org.apache.solr.client.solrj.SolrClient; -import org.apache.solr.client.solrj.SolrQuery; -import org.apache.solr.client.solrj.SolrQuery.SortClause; -import org.apache.solr.client.solrj.impl.CloudSolrClient; -import org.apache.solr.client.solrj.impl.Http2SolrClient; -import org.apache.solr.client.solrj.response.QueryResponse; -import org.apache.solr.common.SolrDocumentList; -import org.kohsuke.args4j.CmdLineException; -import org.kohsuke.args4j.CmdLineParser; -import org.kohsuke.args4j.Option; -import org.kohsuke.args4j.OptionHandlerFilter; -import org.kohsuke.args4j.ParserProperties; -import org.kohsuke.args4j.spi.StringArrayOptionHandler; - -import java.io.Closeable; -import java.io.IOException; -import java.io.PrintWriter; -import java.nio.charset.StandardCharsets; -import java.nio.file.Files; -import java.nio.file.Path; -import java.nio.file.Paths; -import java.util.Locale; -import java.util.Map; -import java.util.Optional; -import java.util.SortedMap; -import java.util.TreeMap; -import java.util.concurrent.TimeUnit; - -/* -* Entry point of the Retrieval. - */ -public final class SearchSolr implements Closeable { - - private static final Logger LOG = LogManager.getLogger(SearchCollection.class); - private static final int TIMEOUT = 600 * 1000; - private final Args args; - private SolrClient client; - - public static final class Args { - - // required arguments - - @Option(name = "-topics", metaVar = "[file]", handler = StringArrayOptionHandler.class, required = true, usage = "topics file") - public String[] topics; - - @Option(name = "-output", metaVar = "[file]", required = true, usage = "output file") - public String output; - - @Option(name = "-topicreader", required = true, usage = "define how to read the topic(query) file: one of [Trec|Webxml]") - public String topicReader; - - @Option(name = "-solr.index", usage = "the name of the index in Solr") - public String solrIndex = null; - - @Option(name = "-solr.zkUrl", usage = "the URL of Solr's ZooKeeper (comma separated list of using ensemble)") - public String zkUrl = null; - - @Option(name = "-solr.zkChroot", usage = "the ZooKeeper chroot") - public String zkChroot = "/"; - - // optional arguments - @Option(name = "-topicfield", usage = "Which field of the query should be used, default \"title\"." 
+ - " For TREC ad hoc topics, description or narrative can be used.") - public String topicfield = "title"; - - @Option(name = "-searchtweets", usage = "Whether the search is against a tweet " + - "index created by IndexCollection -collection TweetCollection") - public Boolean searchtweets = false; - - @Option(name = "-hits", metaVar = "[number]", required = false, usage = "max number of hits to return") - public int hits = 1000; - - @Option(name = "-runtag", metaVar = "[tag]", required = false, usage = "runtag") - public String runtag = null; - - } - - private final class SolrSearcherThread extends Thread { - - final private SortedMap> topics; - final private String outputPath; - final private String runTag; - - private SolrSearcherThread(SortedMap> topics, String outputPath, String runTag){ - - this.topics = topics; - this.runTag = runTag; - this.outputPath = outputPath; - setName(outputPath); - } - - @Override - public void run() { - try { - LOG.info("[Start] Retrieval with Solr collection: " + args.solrIndex); - final long start = System.nanoTime(); - PrintWriter out = new PrintWriter(Files.newBufferedWriter(Paths.get(outputPath), StandardCharsets.US_ASCII)); - - for (Map.Entry> entry : topics.entrySet()) { - K qid = entry.getKey(); - String queryString = entry.getValue().get(args.topicfield); - ScoredDocuments docs; - if (args.searchtweets) { - docs = searchTweets(queryString, Long.parseLong(entry.getValue().get("time"))); - } else { - docs = search(queryString); - } - - /** - * the first column is the topic number. - * the second column is currently unused and should always be "Q0". - * the third column is the official document identifier of the retrieved document. - * the fourth column is the rank the document is retrieved. - * the fifth column shows the score (integer or floating point) that generated the ranking. - * the sixth column is called the "run tag" and should be a unique identifier for your - */ - for (int i = 0; i < docs.documents.length; i++) { - out.println(String.format(Locale.US, "%s Q0 %s %d %f %s", qid, - docs.documents[i].getField(IndexArgs.ID).stringValue(), (i + 1), docs.scores[i], runTag)); - } - } - out.flush(); - out.close(); - - final long durationMillis = TimeUnit.MILLISECONDS.convert(System.nanoTime() - start, TimeUnit.NANOSECONDS); - LOG.info("[Finished] Run " + topics.size() + " topics searched in " - + DurationFormatUtils.formatDuration(durationMillis, "HH:mm:ss")); - } catch (Exception e) { - LOG.error(Thread.currentThread().getName() + ": Unexpected Exception:", e); - } - } - } - - public SearchSolr(Args args) throws IOException { - this.args = args; - LOG.info("Solr index: " + args.solrIndex); - LOG.info("Solr ZooKeeper URL: " + args.zkUrl); - this.client = new CloudSolrClient.Builder(Splitter.on(',') - .splitToList(args.zkUrl), Optional.of(args.zkChroot)) - .withInternalClientBuilder(new Http2SolrClient.Builder().connectionTimeout(TIMEOUT)) - .build(); - } - - @SuppressWarnings("unchecked") - public void runTopics() throws IOException { - TopicReader tr; - SortedMap> topics = new TreeMap<>(); - for (String singleTopicsFile : args.topics) { - Path topicsFilePath = Paths.get(singleTopicsFile); - if (!Files.exists(topicsFilePath) || !Files.isRegularFile(topicsFilePath) || !Files.isReadable(topicsFilePath)) { - throw new IllegalArgumentException("Topics file : " + topicsFilePath + " does not exist or is not a (readable) file."); - } - try { - tr = (TopicReader) Class.forName("io.anserini.search.topicreader." 
+ args.topicReader + "TopicReader") - .getConstructor(Path.class).newInstance(topicsFilePath); - topics.putAll(tr.read()); - } catch (Exception e) { - throw new IllegalArgumentException("Unable to load topic reader: " + args.topicReader); - } - } - - final String runTag = args.runtag == null ? "Solrini" : args.runtag; - SolrSearcherThread solrThread = new SolrSearcherThread(topics, args.output, runTag); - solrThread.run(); - } - - public ScoredDocuments search(String queryString){ - - SolrDocumentList results = null; - - SolrQuery solrq = new SolrQuery(); - solrq.set("df", "contents"); - solrq.set("fl", "* score"); - // Remove some characters in query which are special syntax in Solr query parser - solrq.setQuery(queryString.replaceAll("[+=&|<>!(){}~*?:/\"\\^\\-\\[\\]\\\\]", " ")); - solrq.setRows(args.hits); - solrq.setSort(SortClause.desc("score")); - solrq.addSort(SortClause.asc(IndexArgs.ID)); - - try { - QueryResponse response = client.query(args.solrIndex, solrq); - results = response.getResults(); - } catch (Exception e) { - LOG.error("Exception during Solr query: ", e); - } - - ScoreTiesAdjusterReranker reranker = new ScoreTiesAdjusterReranker(); - return reranker.rerank(ScoredDocuments.fromSolrDocs(results), null); - } - - public ScoredDocuments searchTweets(String queryString, long t){ - - SolrDocumentList results = null; - - SolrQuery solrq = new SolrQuery(); - solrq.set("df", "contents"); - solrq.set("fl", "* score"); - // Remove double quotes in query since they are special syntax in Solr query parser - solrq.setQuery(queryString.replace("\"", "")); - solrq.setRows(args.hits); - solrq.setSort(SortClause.desc("score")); - solrq.addSort(SortClause.desc(TweetGenerator.TweetField.ID_LONG.name)); - - // Do not consider the tweets with tweet ids that are beyond the queryTweetTime - // tag contains the timestamp of the query in terms of the - // chronologically nearest tweet id within the corpus - Query filter = LongPoint.newRangeQuery(TweetGenerator.TweetField.ID_LONG.name, 0L, t); - solrq.set("fq", filter.toString()); - - try { - QueryResponse response = client.query(args.solrIndex, solrq); - results = response.getResults(); - } catch (Exception e) { - LOG.error("Exception during Solr query: ", e); - } - - ScoreTiesAdjusterReranker reranker = new ScoreTiesAdjusterReranker(); - return reranker.rerank(ScoredDocuments.fromSolrDocs(results), null); - } - - @Override - public void close() throws IOException { - client.close(); - } - - public static void main(String[] args) throws Exception { - Args searchSolrArgs = new Args(); - CmdLineParser parser = new CmdLineParser(searchSolrArgs, ParserProperties.defaults().withUsageWidth(90)); - - try { - parser.parseArgument(args); - } catch (CmdLineException e) { - System.err.println(e.getMessage()); - parser.printUsage(System.err); - System.err.println("Example: SearchSolr" + parser.printExample(OptionHandlerFilter.REQUIRED)); - return; - } - - final long start = System.nanoTime(); - SearchSolr searcher = new SearchSolr(searchSolrArgs); - searcher.runTopics(); - searcher.close(); - final long durationMillis = TimeUnit.MILLISECONDS.convert(System.nanoTime() - start, TimeUnit.NANOSECONDS); - LOG.info("Total run time: " + DurationFormatUtils.formatDuration(durationMillis, "HH:mm:ss")); - } -} diff --git a/src/main/python/run_es_regression.py b/src/main/python/run_es_regression.py deleted file mode 100644 index b2084de21d..0000000000 --- a/src/main/python/run_es_regression.py +++ /dev/null @@ -1,256 +0,0 @@ -# -# Pyserini: Python interface to the 
Anserini IR toolkit built on Lucene -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. -# - -import argparse -import logging -import math -import os -import requests -import time - -import regression_utils - -# Note that this class is specifically written with REST API requests instead of the -# Elasticsearch client eliminate an additional dependency - -logger = logging.getLogger('run_es_regression') -ch = logging.StreamHandler() -ch.setFormatter(logging.Formatter('%(asctime)s %(levelname)s - %(message)s')) -logger.addHandler(ch) -logger.setLevel(logging.INFO) - - -class ElasticsearchClient: - def __init__(self): - pass - - @staticmethod - def is_alive(): - try: - response = requests.get('http://localhost:9200/') - response.raise_for_status() - except requests.exceptions.RequestException: - return False - else: - return True - - def does_index_exist(self, collection): - # Make sure ES is alive: - if self.is_alive(): - try: - response = requests.get('http://localhost:9200/{}'.format(collection)) - response.raise_for_status() - except requests.exceptions.RequestException: - return False - else: - return True - else: - raise Exception('ES does not appear to be alive!') - - def delete_index(self, collection): - logger.info('Deleting index {}...'.format(collection)) - # Make sure the index exists: - if self.does_index_exist(collection): - try: - response = requests.request('DELETE', url='http://localhost:9200/{}'.format(collection)) - response.raise_for_status() - except requests.exceptions.RequestException: - return False - else: - return True - else: - raise Exception('The index {} does not exist!'.format(collection)) - - def create_index(self, collection): - logger.info('Creating index {}...'.format(collection)) - # Make sure the index does not exist: - if not self.does_index_exist(collection): - filename = 'src/main/resources/elasticsearch/index-config.{}.json'.format(collection) - if not os.path.exists(filename): - raise Exception('No config found in src/main/resources/elasticsearch/ for {}!'.format(collection)) - logger.info('Using index config for {} at {}'.format(collection, filename)) - with open(filename, mode='r') as file: - json = file.read() - response = '' - try: - response = requests.request('PUT', url='http://localhost:9200/{}'.format(collection), - data=json, headers={'Content-type': 'application/json'}) - response.raise_for_status() - except requests.exceptions.RequestException: - logger.info(response) - return False - else: - return True - else: - raise Exception('The index {} already exists!'.format(collection)) - - def insert_docs(self, collection, path): - logger.info('Inserting documents from {} into {}... '.format(path, collection)) - if not os.path.exists(args.input): - raise Exception('{} does not exist!'.format(args.input)) - if not self.does_index_exist(collection): - raise Exception('The index {} does not exist!'.format(collection)) - # TODO: abstract this into an external config instead of hard-coded. 
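# An illustrative sketch of the TODO above (not part of the patch; all names here are
# hypothetical): the branches below differ only in the collection class, the document
# generator, and one storage flag, so a small lookup table could replace the if/elif chain.
ES_INDEX_CONFIGS = {
    'robust04': ('TrecCollection', 'DefaultLuceneDocumentGenerator', '-storeRaw'),
    'msmarco-passage': ('JsonCollection', 'DefaultLuceneDocumentGenerator', '-storeRaw'),
    'core18': ('WashingtonPostCollection', 'WashingtonPostGenerator', '-storeContents'),
    'msmarco-doc': ('JsonCollection', 'DefaultLuceneDocumentGenerator', '-storeRaw'),
}

def build_es_index_command(collection, path):
    # Assemble the same IndexCollection invocation that the if/elif chain below spells out.
    if collection not in ES_INDEX_CONFIGS:
        raise Exception('Unknown collection: {}'.format(collection))
    coll_class, generator, store_flag = ES_INDEX_CONFIGS[collection]
    return ('sh target/appassembler/bin/IndexCollection -collection {} '
            '-generator {} -es -es.index {} -threads 8 -input {} '
            '-storePositions -storeDocvectors {}').format(
        coll_class, generator, collection, path, store_flag)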
- if collection == 'robust04': - command = 'sh target/appassembler/bin/IndexCollection -collection TrecCollection ' + \ - '-generator DefaultLuceneDocumentGenerator -es -es.index robust04 -threads 8 -input ' + \ - path + ' -storePositions -storeDocvectors -storeRaw' - elif collection == 'msmarco-passage': - command = 'sh target/appassembler/bin/IndexCollection -collection JsonCollection ' + \ - '-generator DefaultLuceneDocumentGenerator -es -es.index msmarco-passage -threads 8 -input ' + \ - path + ' -storePositions -storeDocvectors -storeRaw' - elif collection == 'core18': - command = 'sh target/appassembler/bin/IndexCollection -collection WashingtonPostCollection ' + \ - '-generator WashingtonPostGenerator -es -es.index core18 -threads 8 -input ' + \ - path + ' -storePositions -storeDocvectors -storeContents' - elif collection == 'msmarco-doc': - command = 'sh target/appassembler/bin/IndexCollection -collection JsonCollection ' + \ - '-generator DefaultLuceneDocumentGenerator -es -es.index msmarco-doc -threads 8 -input ' + \ - path + ' -storePositions -storeDocvectors -storeRaw' - else: - raise Exception('Unknown collection: {}'.format(collection)) - logger.info('Running indexing command: ' + command) - return regression_utils.run_shell_command(command, logger, echo=True) - - def evaluate(self, collection): - if not self.does_index_exist(collection): - raise Exception('The index {} does not exist!'.format(collection)) - # TODO: abstract this into an external config instead of hard-coded. - if collection == 'robust04': - command = 'sh target/appassembler/bin/SearchElastic -topicreader Trec -es.index robust04 ' + \ - '-topics src/main/resources/topics-and-qrels/topics.robust04.txt ' + \ - '-output runs/run.es.robust04.bm25.topics.robust04.txt' - elif collection == 'msmarco-passage': - command = 'sh target/appassembler/bin/SearchElastic -topicreader TsvString -es.index msmarco-passage ' + \ - '-topics src/main/resources/topics-and-qrels/topics.msmarco-passage.dev-subset.txt ' + \ - '-output runs/run.es.msmarco-passage.txt' - elif collection == 'core18': - command = 'sh target/appassembler/bin/SearchElastic -topicreader Trec -es.index core18 ' + \ - '-topics src/main/resources/topics-and-qrels/topics.core18.txt ' + \ - '-output runs/run.es.core18.bm25.topics.core18.txt' - elif collection == 'msmarco-doc': - command = 'sh target/appassembler/bin/SearchElastic -topicreader TsvInt -es.index msmarco-doc ' + \ - '-topics src/main/resources/topics-and-qrels/topics.msmarco-doc.dev.txt ' + \ - '-output runs/run.es.msmarco-doc.txt' - else: - raise Exception('Unknown collection: {}'.format(collection)) - - logger.info('Retrieval command: ' + command) - regression_utils.run_shell_command(command, logger, echo=True) - logger.info('Retrieval complete!') - - if collection == 'robust04': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -m map -m P.30 ' + \ - 'src/main/resources/topics-and-qrels/qrels.robust04.txt ' + \ - 'runs/run.es.robust04.bm25.topics.robust04.txt' - elif collection == 'msmarco-passage': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -c -mrecall.1000 -mmap ' + \ - 'src/main/resources/topics-and-qrels/qrels.msmarco-passage.dev-subset.txt ' + \ - 'runs/run.es.msmarco-passage.txt' - elif collection == 'core18': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -m map -m P.30 ' + \ - 'src/main/resources/topics-and-qrels/qrels.core18.txt runs/run.es.core18.bm25.topics.core18.txt' - elif collection == 'msmarco-doc': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -c -mrecall.1000 -mmap 
' + \ - 'src/main/resources/topics-and-qrels/qrels.msmarco-doc.dev.txt runs/run.es.msmarco-doc.txt' - else: - raise Exception('Unknown collection: {}'.format(collection)) - - logger.info('Evaluation command: ' + command) - output = regression_utils.run_shell_command(command, logger, capture=True) - ap = float(output[0].split('\t')[2]) - - if collection == 'robust04': - expected = 0.2531 - elif collection == 'msmarco-passage': - expected = 0.1956 - elif collection == 'core18': - expected = 0.2496 - elif collection == 'msmarco-doc': - expected = 0.2307 - else: - raise Exception('Unknown collection: {}'.format(collection)) - - if math.isclose(ap, expected): - logger.info('[SUCESS] {} MAP verified as expected!'.format(ap)) - else: - logger.info('[FAILED] {} MAP, expected {} MAP!'.format(ap, expected)) - - -if __name__ == '__main__': - parser = argparse.ArgumentParser(description='Program for running Elasticsearch regressions.') - parser.add_argument('--ping', action='store_true', default=False, help='Ping ES and exit.') - parser.add_argument('--check-index-exists', default='', type=str, metavar='collection', - help='Check if index exists.') - parser.add_argument('--delete-index', default='', type=str, metavar='collection', help='Delete index.') - parser.add_argument('--create-index', default='', type=str, metavar='collection', help='Create index.') - parser.add_argument('--insert-docs', default='', type=str, metavar='collection', - help='Insert documents into index.') - parser.add_argument('--input', default='', type=str, metavar='directory', - help='Location of documents to insert into index.') - parser.add_argument('--evaluate', default='', type=str, metavar='collection', - help='Search and evaluate on collection.') - parser.add_argument('--regression', default='', type=str, metavar='collection', help='Run end-to-end regression.') - - args = parser.parse_args() - es = ElasticsearchClient() - - if args.ping: - logger.info('Pinging Elasticsearch instance...') - if es.is_alive(): - logger.info('... appears to alive! :)') - else: - logger.info('... appears to dead! :(') - elif args.check_index_exists: - logger.info('Checking if index {} exists...'.format(args.check_index_exists)) - if es.does_index_exist(args.check_index_exists): - logger.info('... yes indeed!') - else: - logger.info('... appears not.') - elif args.delete_index: - if es.delete_index(args.delete_index): - logger.info('... successful!') - else: - logger.info('... failed!') - elif args.create_index: - if es.create_index(args.create_index): - logger.info('... successful!') - else: - logger.info('... failed!') - elif args.insert_docs: - if not args.input: - raise Exception('Location of corpus not specified (use --input)!') - else: - es.insert_docs(args.insert_docs, args.input) - elif args.evaluate: - es.evaluate(args.evaluate) - elif args.regression: - logger.info('Running BM25 regression on {}...'.format(args.regression)) - if not args.input: - raise Exception('Location of corpus not specified (use --input)!') - if not es.is_alive(): - raise Exception('Elasticsearch does not appear to be alive!') - if es.does_index_exist(args.regression): - logger.info('Index {} already exists: deleting and recreating.'.format(args.regression)) - es.delete_index(args.regression) - es.create_index(args.regression) - es.insert_docs(args.regression, args.input) - # Documents ingested into ES are not immediately searchable. There are lots of 'refresh' options - # to control the visibility behavior, but the simplest solution is just to wait for a bit... 
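# An illustrative alternative (not part of the patch): Elasticsearch also exposes an
# explicit refresh endpoint, POST /<index>/_refresh, which makes newly ingested documents
# searchable on demand. A sketch in this script's REST-only style:
def refresh_index(collection):
    # Force a refresh so that everything indexed so far becomes visible to search.
    response = requests.post('http://localhost:9200/{}/_refresh'.format(collection))
    response.raise_for_status()
# The fixed sleep below is the simpler choice and also gives the node time to settle
# after bulk ingestion, at the cost of always waiting the full interval.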
- logger.info('Document ingestion complete. Sleeping now for 120s...') - time.sleep(120) - logger.info('Waking up!') - es.evaluate(args.regression) diff --git a/src/main/python/run_solr_regression.py b/src/main/python/run_solr_regression.py deleted file mode 100644 index 3fa8486a4b..0000000000 --- a/src/main/python/run_solr_regression.py +++ /dev/null @@ -1,247 +0,0 @@ -# -# Pyserini: Python interface to the Anserini IR toolkit built on Lucene -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. -# - -import argparse -import logging -import math -import os -import requests - -import regression_utils - -logger = logging.getLogger('run_solr_regression') -ch = logging.StreamHandler() -ch.setFormatter(logging.Formatter('%(asctime)s %(levelname)s - %(message)s')) -logger.addHandler(ch) -logger.setLevel(logging.INFO) - - -class SolrClient: - def __init__(self): - pass - - @staticmethod - def is_alive(): - try: - response = requests.get('http://localhost:8983/') - response.raise_for_status() - except requests.exceptions.RequestException: - return False - else: - return True - - def does_index_exist(self, collection): - # Make sure Solr is alive: - if self.is_alive(): - try: - response = requests.get('http://localhost:8983/solr/admin/collections?action=LIST') - response.raise_for_status() - except requests.exceptions.RequestException: - return False - else: - return collection in response.json()['collections'] - else: - raise Exception('Solr does not appear to be alive!') - - def delete_index(self, collection): - # Make sure the index exists: - if self.does_index_exist(collection): - command = 'solrini/bin/solr delete -c {}'.format(collection) - logger.info('Deleting index {} command: {}'.format(collection, command)) - regression_utils.run_shell_command(command, logger, echo=True) - return not self.does_index_exist(collection) - else: - raise Exception('The index {} does not exist!'.format(collection)) - - def create_index(self, collection): - # Make sure the index does not exist: - if not self.does_index_exist(collection): - # Re-upload configsets to Solr's internal Zookeeper - self.upload_configs() - command = 'solrini/bin/solr create -n anserini -c {}'.format(collection) - logger.info('Creating index {} command: {}'.format(collection, command)) - regression_utils.run_shell_command(command, logger, echo=True) - return self.does_index_exist(collection) - else: - raise Exception('The index {} already exists!'.format(collection)) - - def insert_docs(self, collection, path): - logger.info('Inserting documents from {} into {}... 
'.format(path, collection)) - if not os.path.exists(args.input): - raise Exception('{} does not exist!'.format(args.input)) - if not self.does_index_exist(collection): - raise Exception('The index {} does not exist!'.format(collection)) - if collection == 'core18': - command = 'sh target/appassembler/bin/IndexCollection -collection WashingtonPostCollection ' + \ - '-generator WashingtonPostGenerator -solr -solr.index core18 -solr.zkUrl localhost:9983 ' + \ - '-threads 8 -input ' + path + ' -storePositions -storeDocvectors -storeContents' - elif collection == 'robust04': - command = 'sh target/appassembler/bin/IndexCollection -collection TrecCollection ' + \ - '-generator DefaultLuceneDocumentGenerator ' + \ - '-solr -solr.index robust04 -solr.zkUrl localhost:9983 ' + \ - '-threads 8 -input ' + path + ' -storePositions -storeDocvectors -storeRaw' - elif collection == 'msmarco-passage': - command = 'sh target/appassembler/bin/IndexCollection -collection JsonCollection ' + \ - '-generator DefaultLuceneDocumentGenerator ' + \ - '-solr -solr.index msmarco-passage -solr.zkUrl localhost:9983 ' + \ - '-threads 8 -input ' + path + ' -storePositions -storeDocvectors -storeRaw' - elif collection == 'msmarco-doc': - command = 'sh target/appassembler/bin/IndexCollection -collection JsonCollection ' + \ - '-generator DefaultLuceneDocumentGenerator ' + \ - '-solr -solr.index msmarco-doc -solr.zkUrl localhost:9983 ' + \ - '-threads 8 -input ' + path + ' -storePositions -storeDocvectors -storeRaw' - else: - raise Exception('Unknown collection: {}'.format(collection)) - logger.info('Running indexing command: ' + command) - return regression_utils.run_shell_command(command, logger, echo=True) - - @staticmethod - def upload_configs(): - os.chdir('src/main/resources/solr') - command = 'rm -rf anserini/conf/lang anserini-twitter/conf/lang' - logger.info('Deleting existed configs command: ' + command) - regression_utils.run_shell_command(command, logger, echo=True) - command = './solr.sh ../../../../solrini localhost:9983' - logger.info('Uploading configs command: ' + command) - regression_utils.run_shell_command(command, logger, echo=True) - os.chdir('../../../..') - logger.info('Uploading complete!') - - def evaluate(self, collection): - if not self.does_index_exist(collection): - raise Exception('The index {} does not exist!'.format(collection)) - if collection == 'core18': - command = 'sh target/appassembler/bin/SearchSolr -topicreader Trec -solr.index core18 ' + \ - '-solr.zkUrl localhost:9983 -topics src/main/resources/topics-and-qrels/topics.core18.txt ' + \ - '-output runs/run.solr.core18.bm25.topics.core18.txt' - elif collection == 'robust04': - command = 'sh target/appassembler/bin/SearchSolr -topicreader Trec -solr.index robust04 ' + \ - '-solr.zkUrl localhost:9983 -topics src/main/resources/topics-and-qrels/topics.robust04.txt ' + \ - '-output runs/run.solr.robust04.bm25.topics.robust04.txt' - elif collection == 'msmarco-passage': - command = 'sh target/appassembler/bin/SearchSolr -topicreader TsvString -solr.index msmarco-passage ' + \ - '-solr.zkUrl localhost:9983 ' + \ - '-topics src/main/resources/topics-and-qrels/topics.msmarco-passage.dev-subset.txt ' + \ - '-output runs/run.solr.msmarco-passage.txt' - elif collection == 'msmarco-doc': - command = 'sh target/appassembler/bin/SearchSolr -topicreader TsvInt -solr.index msmarco-doc ' + \ - '-solr.zkUrl localhost:9983 ' + \ - '-topics src/main/resources/topics-and-qrels/topics.msmarco-doc.dev.txt ' + \ - '-output runs/run.solr.msmarco-doc.txt ' - 
else: - raise Exception('Unknown collection: {}'.format(collection)) - - logger.info('Retrieval command: ' + command) - regression_utils.run_shell_command(command, logger, echo=True) - logger.info('Retrieval complete!') - - if collection == 'core18': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -m map -m P.30 ' + \ - 'src/main/resources/topics-and-qrels/qrels.core18.txt runs/run.solr.core18.bm25.topics.core18.txt' - elif collection == 'robust04': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -m map -m P.30 ' + \ - 'src/main/resources/topics-and-qrels/qrels.robust04.txt ' + \ - 'runs/run.solr.robust04.bm25.topics.robust04.txt' - elif collection == 'msmarco-passage': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -c -mrecall.1000 -mmap ' + \ - 'src/main/resources/topics-and-qrels/qrels.msmarco-passage.dev-subset.txt ' + \ - 'runs/run.solr.msmarco-passage.txt' - elif collection == 'msmarco-doc': - command = 'tools/eval/trec_eval.9.0.4/trec_eval -c -mrecall.1000 -mmap ' + \ - 'src/main/resources/topics-and-qrels/qrels.msmarco-doc.dev.txt runs/run.solr.msmarco-doc.txt' - else: - raise Exception('Unknown collection: {}'.format(collection)) - - logger.info('Evaluation command: ' + command) - output = regression_utils.run_shell_command(command, logger, capture=True) - ap = float(output[0].split('\t')[2]) - - if collection == 'core18': - expected = 0.2496 - elif collection == 'robust04': - expected = 0.2531 - elif collection == 'msmarco-passage': - expected = 0.1926 - elif collection == 'msmarco-doc': - expected = 0.2305 - else: - raise Exception('Unknown collection: {}'.format(collection)) - - if math.isclose(ap, expected): - logger.info('[SUCESS] {} MAP verified as expected!'.format(ap)) - else: - logger.info('[FAILED] {} MAP, expected {} MAP!'.format(ap, expected)) - - -if __name__ == '__main__': - parser = argparse.ArgumentParser(description='Program for running Solr regressions.') - parser.add_argument('--ping', action='store_true', default=False, help='ping Solr and exit') - parser.add_argument('--check-index-exists', default='', type=str, metavar='collection', - help='Check if index exists.') - parser.add_argument('--delete-index', default='', type=str, metavar='collection', help='Delete index.') - parser.add_argument('--create-index', default='', type=str, metavar='collection', help='Create index.') - parser.add_argument('--insert-docs', default='', type=str, metavar='collection', - help='Insert documents into index.') - parser.add_argument('--input', default='', type=str, metavar='directory', - help='Location of documents to insert into index.') - parser.add_argument('--evaluate', default='', type=str, metavar='collection', - help='Search and evaluate on collection.') - parser.add_argument('--regression', default='', type=str, metavar='collection', help='Run end-to-end regression.') - - args = parser.parse_args() - solr = SolrClient() - - if args.ping: - logger.info('Pinging Solr instance...') - if solr.is_alive(): - logger.info('... appears to alive! :)') - else: - logger.info('... appears to dead! :(') - elif args.check_index_exists: - logger.info('Checking if index {} exists...'.format(args.check_index_exists)) - if solr.does_index_exist(args.check_index_exists): - logger.info('... yes indeed!') - else: - logger.info('... appears not.') - elif args.delete_index: - if solr.delete_index(args.delete_index): - logger.info('... successful!') - else: - logger.info('... failed!') - elif args.create_index: - if solr.create_index(args.create_index): - logger.info('... 
successful!') - else: - logger.info('... failed!') - elif args.insert_docs: - if not args.input: - raise Exception('Location of corpus not specified (use --input)!') - else: - solr.insert_docs(args.insert_docs, args.input) - elif args.evaluate: - solr.evaluate(args.evaluate) - elif args.regression: - logger.info('Running BM25 regression on {}...'.format(args.regression)) - if not args.input: - raise Exception('Location of corpus not specified (use --input)!') - if not solr.is_alive(): - raise Exception('Solr does not appear to be alive!') - if solr.does_index_exist(args.regression): - logger.info('Index {} already exists: deleting and recreating.'.format(args.regression)) - solr.delete_index(args.regression) - solr.create_index(args.regression) - solr.insert_docs(args.regression, args.input) - solr.evaluate(args.regression) diff --git a/src/main/resources/elasticsearch/index-config.cord19.json b/src/main/resources/elasticsearch/index-config.cord19.json deleted file mode 100644 index c7c08e4610..0000000000 --- a/src/main/resources/elasticsearch/index-config.cord19.json +++ /dev/null @@ -1,32 +0,0 @@ -{ - "mappings": { - "properties": { - "id": { - "type": "keyword" - }, - "contents": { - "type": "text", - "store": false, - "index": true, - "analyzer": "english" - }, - "raw": { - "type": "text", - "store": true, - "index": false - } - } - }, - "settings": { - "index": { - "refresh_interval": "60s", - "similarity": { - "default": { - "type": "BM25", - "k1": "0.9", - "b": "0.4" - } - } - } - } -} diff --git a/src/main/resources/elasticsearch/index-config.core18.json b/src/main/resources/elasticsearch/index-config.core18.json deleted file mode 100644 index c7c08e4610..0000000000 --- a/src/main/resources/elasticsearch/index-config.core18.json +++ /dev/null @@ -1,32 +0,0 @@ -{ - "mappings": { - "properties": { - "id": { - "type": "keyword" - }, - "contents": { - "type": "text", - "store": false, - "index": true, - "analyzer": "english" - }, - "raw": { - "type": "text", - "store": true, - "index": false - } - } - }, - "settings": { - "index": { - "refresh_interval": "60s", - "similarity": { - "default": { - "type": "BM25", - "k1": "0.9", - "b": "0.4" - } - } - } - } -} diff --git a/src/main/resources/elasticsearch/index-config.msmarco-doc.json b/src/main/resources/elasticsearch/index-config.msmarco-doc.json deleted file mode 100644 index c7c08e4610..0000000000 --- a/src/main/resources/elasticsearch/index-config.msmarco-doc.json +++ /dev/null @@ -1,32 +0,0 @@ -{ - "mappings": { - "properties": { - "id": { - "type": "keyword" - }, - "contents": { - "type": "text", - "store": false, - "index": true, - "analyzer": "english" - }, - "raw": { - "type": "text", - "store": true, - "index": false - } - } - }, - "settings": { - "index": { - "refresh_interval": "60s", - "similarity": { - "default": { - "type": "BM25", - "k1": "0.9", - "b": "0.4" - } - } - } - } -} diff --git a/src/main/resources/elasticsearch/index-config.msmarco-passage.json b/src/main/resources/elasticsearch/index-config.msmarco-passage.json deleted file mode 100644 index ad33344097..0000000000 --- a/src/main/resources/elasticsearch/index-config.msmarco-passage.json +++ /dev/null @@ -1,32 +0,0 @@ -{ - "mappings": { - "properties": { - "id": { - "type": "keyword" - }, - "contents": { - "type": "text", - "store": false, - "index": true, - "analyzer": "english" - }, - "raw": { - "type": "text", - "store": true, - "index": false - } - } - }, - "settings": { - "index": { - "refresh_interval": "60s", - "similarity": { - "default": { - "type": 
"BM25", - "k1": "0.82", - "b": "0.68" - } - } - } - } -} diff --git a/src/main/resources/elasticsearch/index-config.robust04.json b/src/main/resources/elasticsearch/index-config.robust04.json deleted file mode 100644 index c7c08e4610..0000000000 --- a/src/main/resources/elasticsearch/index-config.robust04.json +++ /dev/null @@ -1,32 +0,0 @@ -{ - "mappings": { - "properties": { - "id": { - "type": "keyword" - }, - "contents": { - "type": "text", - "store": false, - "index": true, - "analyzer": "english" - }, - "raw": { - "type": "text", - "store": true, - "index": false - } - } - }, - "settings": { - "index": { - "refresh_interval": "60s", - "similarity": { - "default": { - "type": "BM25", - "k1": "0.9", - "b": "0.4" - } - } - } - } -} diff --git a/src/main/resources/solr/anserini-twitter/conf/managed-schema b/src/main/resources/solr/anserini-twitter/conf/managed-schema deleted file mode 100644 index 08e1f08be5..0000000000 --- a/src/main/resources/solr/anserini-twitter/conf/managed-schema +++ /dev/null @@ -1,216 +0,0 @@ - - - - id - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 0.9 - 0.4 - - - diff --git a/src/main/resources/solr/anserini-twitter/conf/params.json b/src/main/resources/solr/anserini-twitter/conf/params.json deleted file mode 100644 index 06114ef257..0000000000 --- a/src/main/resources/solr/anserini-twitter/conf/params.json +++ /dev/null @@ -1,20 +0,0 @@ -{"params":{ - "query":{ - "defType":"edismax", - "q.alt":"*:*", - "rows":"10", - "fl":"*,score", - "":{"v":0} - }, - "facets":{ - "facet":"on", - "facet.mincount": "1", - "":{"v":0} - }, - "velocity":{ - "wt": "velocity", - "v.template":"browse", - "v.layout": "layout", - "":{"v":0} - } -}} \ No newline at end of file diff --git a/src/main/resources/solr/anserini-twitter/conf/protwords.txt b/src/main/resources/solr/anserini-twitter/conf/protwords.txt deleted file mode 100644 index 1dfc0abecb..0000000000 --- a/src/main/resources/solr/anserini-twitter/conf/protwords.txt +++ /dev/null @@ -1,21 +0,0 @@ -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -#----------------------------------------------------------------------- -# Use a protected word file to protect against the stemmer reducing two -# unrelated words to the same base word. - -# Some non-words that normally won't be encountered, -# just to test that they won't be stemmed. 
-dontstems -zwhacky - diff --git a/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml b/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml deleted file mode 100644 index 5f3e4208ef..0000000000 --- a/src/main/resources/solr/anserini-twitter/conf/solrconfig.xml +++ /dev/null @@ -1,1341 +0,0 @@ - - - - - - - - - 9.0.0 - - - - - - - - - ${solr.data.dir:} - - - - - - - - - - - - - - - - - - - 2048 - - - - - - - - - - ${solr.lock.type:native} - - - - - - - - - - - - - - - - - - - - - - - - - - - - - ${solr.ulog.dir:} - ${solr.ulog.numVersionBuckets:65536} - - - - - ${solr.autoCommit.maxTime:15000} - false - - - - - - ${solr.autoSoftCommit.maxTime:-1} - - - - - - - - - - - - - - 1024 - - - - - - - - - - - - - - - - - - - - - - - - true - - - - - - 20 - - - 200 - - - - - - - - - - - - - - - - false - - - - - - - - - - - - - - - - - - - - - - explicit - 10 - - - - - - - - - - - - - - - - explicit - json - true - - - - - - - - explicit - - - - - - _text_ - - - - - - - true - ignored_ - _text_ - - - - - - - - - text_general - - - - - - default - _text_ - solr.DirectSolrSpellChecker - - internal - - 0.5 - - 2 - - 1 - - 5 - - 4 - - 0.01 - - - - - - - - - - - - default - on - true - 10 - 5 - 5 - true - true - 10 - 5 - - - spellcheck - - - - - - - - - - true - - - tvComponent - - - - - - - - - - - - true - false - - - terms - - - - - - - - string - - - - - - explicit - - - elevator - - - - - - - - - - - 100 - - - - - - - - 70 - - 0.5 - - [-\w ,/\n\"']{20,200} - - - - - - - ]]> - ]]> - - - - - - - - - - - - - - - - - - - - - - - - ,, - ,, - ,, - ,, - ,]]> - ]]> - - - - - - 10 - .,!? - - - - - - - WORD - - - en - US - - - - - - - - - - - - [^\w-\.] - _ - - - - - - - yyyy-MM-dd'T'HH:mm:ss.SSSZ - yyyy-MM-dd'T'HH:mm:ss,SSSZ - yyyy-MM-dd'T'HH:mm:ss.SSS - yyyy-MM-dd'T'HH:mm:ss,SSS - yyyy-MM-dd'T'HH:mm:ssZ - yyyy-MM-dd'T'HH:mm:ss - yyyy-MM-dd'T'HH:mmZ - yyyy-MM-dd'T'HH:mm - yyyy-MM-dd HH:mm:ss.SSSZ - yyyy-MM-dd HH:mm:ss,SSSZ - yyyy-MM-dd HH:mm:ss.SSS - yyyy-MM-dd HH:mm:ss,SSS - yyyy-MM-dd HH:mm:ssZ - yyyy-MM-dd HH:mm:ss - yyyy-MM-dd HH:mmZ - yyyy-MM-dd HH:mm - yyyy-MM-dd - - - - - java.lang.String - text_general - - *_str - 256 - - - true - - - java.lang.Boolean - booleans - - - java.util.Date - pdates - - - java.lang.Long - java.lang.Integer - plongs - - - java.lang.Number - pdoubles - - - - - - - - - - - - - - - - - - - - - - - - - - text/plain; charset=UTF-8 - - - - - ${velocity.template.base.dir:} - ${velocity.solr.resource.loader.enabled:true} - ${velocity.params.resource.loader.enabled:false} - - - - - - - - - - - - - - diff --git a/src/main/resources/solr/anserini-twitter/conf/stopwords_en.txt b/src/main/resources/solr/anserini-twitter/conf/stopwords_en.txt deleted file mode 100644 index e11bbd5670..0000000000 --- a/src/main/resources/solr/anserini-twitter/conf/stopwords_en.txt +++ /dev/null @@ -1,49 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one or more -# contributor license agreements. See the NOTICE file distributed with -# this work for additional information regarding copyright ownership. -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
-# See the License for the specific language governing permissions and -# limitations under the License. - -# Standard english stop words taken from Lucene's StopAnalyzer -a -an -and -are -as -at -be -but -by -for -if -in -into -is -it -no -not -of -on -or -such -that -the -their -then -there -these -they -this -to -was -will -with diff --git a/src/main/resources/solr/anserini-twitter/conf/synonyms.txt b/src/main/resources/solr/anserini-twitter/conf/synonyms.txt deleted file mode 100644 index eab4ee8753..0000000000 --- a/src/main/resources/solr/anserini-twitter/conf/synonyms.txt +++ /dev/null @@ -1,29 +0,0 @@ -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -#----------------------------------------------------------------------- -#some test synonym mappings unlikely to appear in real input text -aaafoo => aaabar -bbbfoo => bbbfoo bbbbar -cccfoo => cccbar cccbaz -fooaaa,baraaa,bazaaa - -# Some synonym groups specific to this example -GB,gib,gigabyte,gigabytes -MB,mib,megabyte,megabytes -Television, Televisions, TV, TVs -#notice we use "gib" instead of "GiB" so any WordDelimiterGraphFilter coming -#after us won't split it into two words. - -# Synonym mappings can be used for spelling correction too -pixima => pixma - diff --git a/src/main/resources/solr/anserini/conf/managed-schema b/src/main/resources/solr/anserini/conf/managed-schema deleted file mode 100644 index 08e1f08be5..0000000000 --- a/src/main/resources/solr/anserini/conf/managed-schema +++ /dev/null @@ -1,216 +0,0 @@ - - - - id - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 0.9 - 0.4 - - - diff --git a/src/main/resources/solr/anserini/conf/params.json b/src/main/resources/solr/anserini/conf/params.json deleted file mode 100644 index 06114ef257..0000000000 --- a/src/main/resources/solr/anserini/conf/params.json +++ /dev/null @@ -1,20 +0,0 @@ -{"params":{ - "query":{ - "defType":"edismax", - "q.alt":"*:*", - "rows":"10", - "fl":"*,score", - "":{"v":0} - }, - "facets":{ - "facet":"on", - "facet.mincount": "1", - "":{"v":0} - }, - "velocity":{ - "wt": "velocity", - "v.template":"browse", - "v.layout": "layout", - "":{"v":0} - } -}} \ No newline at end of file diff --git a/src/main/resources/solr/anserini/conf/protwords.txt b/src/main/resources/solr/anserini/conf/protwords.txt deleted file mode 100644 index 1dfc0abecb..0000000000 --- a/src/main/resources/solr/anserini/conf/protwords.txt +++ /dev/null @@ -1,21 +0,0 @@ -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. 
You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -#----------------------------------------------------------------------- -# Use a protected word file to protect against the stemmer reducing two -# unrelated words to the same base word. - -# Some non-words that normally won't be encountered, -# just to test that they won't be stemmed. -dontstems -zwhacky - diff --git a/src/main/resources/solr/anserini/conf/solrconfig.xml b/src/main/resources/solr/anserini/conf/solrconfig.xml deleted file mode 100644 index b00368515b..0000000000 --- a/src/main/resources/solr/anserini/conf/solrconfig.xml +++ /dev/null @@ -1,1343 +0,0 @@ - - - - - - - - - 9.0.0 - - - - - - - - - - ${solr.data.dir:} - - - - - - - - - - - - - - - - - - - 2048 - - - - - - - - - - ${solr.lock.type:native} - - - - - - - - - - - - - - - - - - - - - - - - - - - - - ${solr.ulog.dir:} - ${solr.ulog.numVersionBuckets:65536} - - - - - ${solr.autoCommit.maxTime:15000} - false - - - - - - ${solr.autoSoftCommit.maxTime:-1} - - - - - - - - - - - - - - 1024 - - - - - - - - - - - - - - - - - - - - - - - - true - - - - - - 20 - - - 200 - - - - - - - - - - - - - - - - false - - - - - - - - - - - - - - - - - - - - - - explicit - 10 - - - - - - - - - - - - - - - - explicit - json - true - - - - - - - - explicit - - - - - - _text_ - - - - - - - true - ignored_ - _text_ - - - - - - - - - text_general - - - - - - default - _text_ - solr.DirectSolrSpellChecker - - internal - - 0.5 - - 2 - - 1 - - 5 - - 4 - - 0.01 - - - - - - - - - - - - default - on - true - 10 - 5 - 5 - true - true - 10 - 5 - - - spellcheck - - - - - - - - - - true - - - tvComponent - - - - - - - - - - - - true - false - - - terms - - - - - - - - string - - - - - - explicit - - - elevator - - - - - - - - - - - 100 - - - - - - - - 70 - - 0.5 - - [-\w ,/\n\"']{20,200} - - - - - - - ]]> - ]]> - - - - - - - - - - - - - - - - - - - - - - - - ,, - ,, - ,, - ,, - ,]]> - ]]> - - - - - - 10 - .,!? - - - - - - - WORD - - - en - US - - - - - - - - - - - - [^\w-\.] 
- _ - - - - - - - yyyy-MM-dd'T'HH:mm:ss.SSSZ - yyyy-MM-dd'T'HH:mm:ss,SSSZ - yyyy-MM-dd'T'HH:mm:ss.SSS - yyyy-MM-dd'T'HH:mm:ss,SSS - yyyy-MM-dd'T'HH:mm:ssZ - yyyy-MM-dd'T'HH:mm:ss - yyyy-MM-dd'T'HH:mmZ - yyyy-MM-dd'T'HH:mm - yyyy-MM-dd HH:mm:ss.SSSZ - yyyy-MM-dd HH:mm:ss,SSSZ - yyyy-MM-dd HH:mm:ss.SSS - yyyy-MM-dd HH:mm:ss,SSS - yyyy-MM-dd HH:mm:ssZ - yyyy-MM-dd HH:mm:ss - yyyy-MM-dd HH:mmZ - yyyy-MM-dd HH:mm - yyyy-MM-dd - - - - - java.lang.String - text_general - - *_str - 256 - - - true - - - java.lang.Boolean - booleans - - - java.util.Date - pdates - - - java.lang.Long - java.lang.Integer - plongs - - - java.lang.Number - pdoubles - - - - - - - - - - - - - - - - - - - - - - - - - - text/plain; charset=UTF-8 - - - - - ${velocity.template.base.dir:} - ${velocity.solr.resource.loader.enabled:true} - ${velocity.params.resource.loader.enabled:false} - - - - - - - - - - - - - - - diff --git a/src/main/resources/solr/anserini/conf/stopwords_en.txt b/src/main/resources/solr/anserini/conf/stopwords_en.txt deleted file mode 100644 index e11bbd5670..0000000000 --- a/src/main/resources/solr/anserini/conf/stopwords_en.txt +++ /dev/null @@ -1,49 +0,0 @@ -# Licensed to the Apache Software Foundation (ASF) under one or more -# contributor license agreements. See the NOTICE file distributed with -# this work for additional information regarding copyright ownership. -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -# Standard english stop words taken from Lucene's StopAnalyzer -a -an -and -are -as -at -be -but -by -for -if -in -into -is -it -no -not -of -on -or -such -that -the -their -then -there -these -they -this -to -was -will -with diff --git a/src/main/resources/solr/anserini/conf/synonyms.txt b/src/main/resources/solr/anserini/conf/synonyms.txt deleted file mode 100644 index eab4ee8753..0000000000 --- a/src/main/resources/solr/anserini/conf/synonyms.txt +++ /dev/null @@ -1,29 +0,0 @@ -# The ASF licenses this file to You under the Apache License, Version 2.0 -# (the "License"); you may not use this file except in compliance with -# the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -#----------------------------------------------------------------------- -#some test synonym mappings unlikely to appear in real input text -aaafoo => aaabar -bbbfoo => bbbfoo bbbbar -cccfoo => cccbar cccbaz -fooaaa,baraaa,bazaaa - -# Some synonym groups specific to this example -GB,gib,gigabyte,gigabytes -MB,mib,megabyte,megabytes -Television, Televisions, TV, TVs -#notice we use "gib" instead of "GiB" so any WordDelimiterGraphFilter coming -#after us won't split it into two words. 
- -# Synonym mappings can be used for spelling correction too -pixima => pixma - diff --git a/src/main/resources/solr/schemas/acl-anthology.json b/src/main/resources/solr/schemas/acl-anthology.json deleted file mode 100644 index e358861e83..0000000000 --- a/src/main/resources/solr/schemas/acl-anthology.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "add-field": { - "name":"authors", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"sigs", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"venues", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"pages", - "type":"string", - "stored":true, - "docValues": false - } -} \ No newline at end of file diff --git a/src/main/resources/solr/schemas/cord19.json b/src/main/resources/solr/schemas/cord19.json deleted file mode 100644 index 8a9d305b9b..0000000000 --- a/src/main/resources/solr/schemas/cord19.json +++ /dev/null @@ -1,86 +0,0 @@ -{ - "add-field": { - "name":"authors", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"source_x", - "type":"string", - "stored":true, - "multiValued": true - }, - "add-field": { - "name":"pmcid", - "type":"string", - "stored":true, - "docValues": true - }, - "add-field": { - "name":"pubmed_id", - "type":"string", - "stored":true, - "docValues": true - }, - "add-field": { - "name":"publish_time", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"doi", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"journal", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"license", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"sha", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"url", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"year", - "type":"pint", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"outcomes_vocab", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"population_vocab", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"interventions_vocab", - "type":"string", - "stored":true, - "multiValued":true - } -} diff --git a/src/main/resources/solr/schemas/core.json b/src/main/resources/solr/schemas/core.json deleted file mode 100644 index f6c205539b..0000000000 --- a/src/main/resources/solr/schemas/core.json +++ /dev/null @@ -1,56 +0,0 @@ -{ - "add-field": { - "name":"authors", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":true - }, - "add-field": { - "name":"contributors", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":true - }, - "add-field": { - "name":"identifiers", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":true - }, - "add-field": { - "name":"journals", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":false - }, - "add-field": { - "name":"relations", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":true - }, - "add-field": { - "name":"subjects", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":true - }, - "add-field": { - "name":"topics", - "type":"string", - "stored":true, - "multiValued":true, - "docValues":true - }, - "add-field": { - "name":"datePublished", - "type":"string", - "stored":true - 
} -} \ No newline at end of file diff --git a/src/main/resources/solr/schemas/covid.json b/src/main/resources/solr/schemas/covid.json deleted file mode 100644 index f6a1f237f3..0000000000 --- a/src/main/resources/solr/schemas/covid.json +++ /dev/null @@ -1,86 +0,0 @@ -{ - "add-field": { - "name":"authors", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"source_x", - "type":"string", - "stored":true, - "docValues": true - }, - "add-field": { - "name":"pmcid", - "type":"string", - "stored":true, - "docValues": true - }, - "add-field": { - "name":"pubmed_id", - "type":"string", - "stored":true, - "docValues": true - }, - "add-field": { - "name":"publish_time", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"doi", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"journal", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"license", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"sha", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"url", - "type":"string", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"year", - "type":"pint", - "stored":true, - "docValues":true - }, - "add-field": { - "name":"outcomes_vocab", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"population_vocab", - "type":"string", - "stored":true, - "multiValued":true - }, - "add-field": { - "name":"interventions_vocab", - "type":"string", - "stored":true, - "multiValued":true - } -} diff --git a/src/main/resources/solr/solr.sh b/src/main/resources/solr/solr.sh deleted file mode 100755 index 194ea446d8..0000000000 --- a/src/main/resources/solr/solr.sh +++ /dev/null @@ -1,23 +0,0 @@ -#!/usr/bin/env sh - -### -# This script assumes a single-node SolrCloud instance is running locally. -### - -if [[ -z "$1" ]]; then - echo "Usage: ./solr.sh " - exit 1 -fi - -# Solr install directory -SOLR_DIR=$1 - -# Solr's ZooKeeper URL -ZOOKEEPER_URL=$2 - -# Copy anserini into lib dir -mkdir ${SOLR_DIR}/lib && cp ../../../../target/anserini-*-fatjar.jar ${SOLR_DIR}/lib - -# Upload configset to Solr -${SOLR_DIR}/bin/solr zk -z ${ZOOKEEPER_URL:-localhost:9983} upconfig -n anserini -d anserini -${SOLR_DIR}/bin/solr zk -z ${ZOOKEEPER_URL:-localhost:9983} upconfig -n anserini-twitter -d anserini-twitter diff --git a/src/test/java/io/anserini/integration/solr/AclAnthologyEndToEndTest.java b/src/test/java/io/anserini/integration/solr/AclAnthologyEndToEndTest.java deleted file mode 100644 index a46383b484..0000000000 --- a/src/test/java/io/anserini/integration/solr/AclAnthologyEndToEndTest.java +++ /dev/null @@ -1,57 +0,0 @@ -/* - * Anserini: A Lucene toolkit for reproducible information retrieval research - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. 
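The deleted helper above took a Solr install directory and, optionally, a ZooKeeper address, falling back to localhost:9983 via the ${ZOOKEEPER_URL:-...} expansion. A usage sketch with a hypothetical install path, run from src/main/resources/solr/ so the relative configset paths resolve:

    # /opt/solr is an assumed install location; the second argument may be omitted.
    cd src/main/resources/solr
    ./solr.sh /opt/solr localhost:9983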
diff --git a/src/test/java/io/anserini/integration/solr/AclAnthologyEndToEndTest.java b/src/test/java/io/anserini/integration/solr/AclAnthologyEndToEndTest.java
deleted file mode 100644
index a46383b484..0000000000
--- a/src/test/java/io/anserini/integration/solr/AclAnthologyEndToEndTest.java
+++ /dev/null
@@ -1,57 +0,0 @@
-/*
- * Anserini: A Lucene toolkit for reproducible information retrieval research
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *   http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package io.anserini.integration.solr;
-
-import io.anserini.collection.AclAnthology;
-import io.anserini.index.IndexArgs;
-import io.anserini.index.generator.AclAnthologyGenerator;
-import io.anserini.search.SearchSolr;
-
-public class AclAnthologyEndToEndTest extends SolrEndToEndTest {
-  @Override
-  protected String getCollectionName() {
-    return "AclAnthology";
-  }
-
-  @Override
-  protected String getSchemaAdjustmentFile() {
-    return "solr/schemas/acl-anthology.json";
-  }
-
-  @Override
-  public IndexArgs getIndexArgs() {
-    IndexArgs indexArgs = createDefaultIndexArgs();
-    indexArgs.input = "src/test/resources/sample_docs/acl";
-    indexArgs.collectionClass = AclAnthology.class.getSimpleName();
-    indexArgs.generatorClass = AclAnthologyGenerator.class.getSimpleName();
-    return indexArgs;
-  }
-
-  @Override
-  protected SearchSolr.Args getSearchArgs() {
-    return createSearchArgs("TsvInt", "src/test/resources/sample_topics/acl_topics.tsv");
-  }
-
-  @Override
-  protected String[] getRefRankingResult() {
-    return new String[]{ // bm25
-        "1 Q0 C00-1007 1 0.294000 Solrini",
-        "1 Q0 E17-1003 2 0.186100 Solrini",
-        "2 Q0 C00-1003 1 0.622700 Solrini"
-    };
-  }
-}
diff --git a/src/test/java/io/anserini/integration/solr/CoreEndToEndTest.java b/src/test/java/io/anserini/integration/solr/CoreEndToEndTest.java
deleted file mode 100644
index 761e12e537..0000000000
--- a/src/test/java/io/anserini/integration/solr/CoreEndToEndTest.java
+++ /dev/null
@@ -1,59 +0,0 @@
-/*
- * Anserini: A Lucene toolkit for reproducible information retrieval research
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *   http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package io.anserini.integration.solr;
-
-import io.anserini.collection.CoreCollection;
-import io.anserini.index.IndexArgs;
-import io.anserini.index.generator.CoreGenerator;
-import io.anserini.search.SearchSolr;
-
-public class CoreEndToEndTest extends SolrEndToEndTest {
-  @Override
-  protected String getCollectionName() {
-    return "Core";
-  }
-
-  @Override
-  protected String getSchemaAdjustmentFile() {
-    return "solr/schemas/core.json";
-  }
-
-  @Override
-  protected IndexArgs getIndexArgs() {
-    IndexArgs indexArgs = createDefaultIndexArgs();
-    indexArgs.input = "src/test/resources/sample_docs/core";
-    indexArgs.collectionClass = CoreCollection.class.getSimpleName();
-    indexArgs.generatorClass = CoreGenerator.class.getSimpleName();
-    return indexArgs;
-  }
-
-  @Override
-  protected SearchSolr.Args getSearchArgs() {
-    return createSearchArgs("TsvInt", "src/test/resources/sample_topics/core_topics.tsv");
-  }
-
-  @Override
-  protected String[] getRefRankingResult() {
-    return new String[]{ // bm25
-        "1 Q0 coreDoc1 1 0.243200 Solrini",
-        "1 Q0 doi2 2 0.243199 Solrini",
-        "2 Q0 coreDoc1 1 0.243200 Solrini",
-        "2 Q0 doi2 2 0.243199 Solrini",
-        "3 Q0 fullCoreDoc 1 0.534600 Solrini"
-    };
-  }
-}
diff --git a/src/test/java/io/anserini/integration/solr/SolrEndToEndTest.java b/src/test/java/io/anserini/integration/solr/SolrEndToEndTest.java
deleted file mode 100644
index d2529d7c6d..0000000000
--- a/src/test/java/io/anserini/integration/solr/SolrEndToEndTest.java
+++ /dev/null
@@ -1,222 +0,0 @@
-/*
- * Anserini: A Lucene toolkit for reproducible information retrieval research
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *   http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package io.anserini.integration.solr;
-
-import io.anserini.index.IndexArgs;
-import io.anserini.index.IndexCollection;
-import io.anserini.search.SearchSolr;
-import org.apache.commons.io.FileUtils;
-import org.apache.commons.pool2.BasePooledObjectFactory;
-import org.apache.commons.pool2.ObjectPool;
-import org.apache.commons.pool2.PooledObject;
-import org.apache.commons.pool2.impl.DefaultPooledObject;
-import org.apache.commons.pool2.impl.GenericObjectPool;
-import org.apache.commons.pool2.impl.GenericObjectPoolConfig;
-import org.apache.logging.log4j.LogManager;
-import org.apache.logging.log4j.Logger;
-import org.apache.lucene.util.LuceneTestCase;
-import org.apache.solr.client.solrj.SolrClient;
-import org.apache.solr.client.solrj.embedded.EmbeddedSolrServer;
-import org.apache.solr.client.solrj.request.CoreAdminRequest;
-import org.apache.solr.client.solrj.request.json.DirectJsonQueryRequest;
-import org.apache.solr.client.solrj.response.QueryResponse;
-import org.apache.solr.common.params.CommonParams;
-import org.apache.solr.common.params.ModifiableSolrParams;
-import org.apache.solr.core.NodeConfig;
-import org.apache.solr.core.SolrResourceLoader;
-import org.junit.After;
-import org.junit.Before;
-import org.junit.Test;
-
-import java.io.BufferedReader;
-import java.io.File;
-import java.io.FileReader;
-import java.lang.reflect.Field;
-import java.net.URL;
-import java.nio.file.Files;
-
-
-@LuceneTestCase.SuppressSysoutChecks(bugUrl = "None")
-public abstract class SolrEndToEndTest extends LuceneTestCase {
-  private static final Logger LOG = LogManager.getLogger(SolrEndToEndTest.class);
-
-  protected ObjectPool<SolrClient> stubSolrPool;
-  protected final String searchOutputPrefix = "e2eTestSearch";
-
-  protected EmbeddedSolrServer client;
-
-  protected static File getFile(String path) {
-    final URL url = SolrEndToEndTest.class.getClassLoader().getResource(path);
-    if (url != null) {
-      try {
-        return new File(url.toURI());
-      } catch (Exception e) {
-        throw new RuntimeException("Resource was found on classpath, but cannot be resolved to a normal file: " + path);
-      }
-    }
-    final File file = new File(path);
-    if (file.exists()) {
-      return file;
-    }
-    throw new RuntimeException("Cannot find resource in classpath or in file-system (relative to CWD): " + path);
-  }
-
-  @Before
-  @Override
-  public void setUp() throws Exception {
-    super.setUp();
-
-    final File solrHome = createTempDir().toFile();
-    final File configSetBaseDir = new File(solrHome.toPath() + File.separator + "configsets");
-    FileUtils.copyDirectory(getFile("solr/anserini"), new File(configSetBaseDir + File.separator + "anserini"));
-
-    SolrResourceLoader loader = new SolrResourceLoader(solrHome.toPath());
-    NodeConfig config = new NodeConfig.NodeConfigBuilder("embeddedSolrServerNode", loader.getInstancePath())
-        .setConfigSetBaseDirectory(configSetBaseDir.getAbsolutePath()).build();
-    client = new EmbeddedSolrServer(config, getCollectionName());
-    LOG.info("Created Embedded Solr Server");
-
-    CoreAdminRequest.Create createRequest = new CoreAdminRequest.Create();
-    createRequest.setCoreName(getCollectionName());
-    createRequest.setConfigSet("anserini");
-    createRequest.process(client);
-    client.commit();
-    LOG.info("Created Solr Core: " + getCollectionName());
-
-    GenericObjectPoolConfig<SolrClient> poolConfig = new GenericObjectPoolConfig<>();
-    poolConfig.setMaxTotal(1); // only 1 EmbeddedSolrServer instance will be created by getSolrClient
-    poolConfig.setMinIdle(1);
-    stubSolrPool = new GenericObjectPool<>(new StubSolrClientFactory(client), poolConfig);
-  }
-
-  @After
-  @Override
-  public void tearDown() throws Exception {
-    super.tearDown();
-
-    client.deleteByQuery("*:*");
-    client.commit();
-    client.close();
-    stubSolrPool.close();
-  }
-
-  protected IndexArgs createDefaultIndexArgs() {
-    IndexArgs args = new IndexArgs();
-
-    args.solrIndex = getCollectionName();
-    args.threads = 1;
-    args.storePositions = true;
-    args.storeDocvectors = true;
-    args.storeContents = true;
-    args.storeRaw = true;
-    args.optimize = true;
-    args.quiet = true;
-    args.solr = true;
-
-    return args;
-  }
-
-  protected SearchSolr.Args createSearchArgs(String topicReader, String topicFile) {
-    SearchSolr.Args args = new SearchSolr.Args();
-
-    args.solrIndex = getCollectionName();
-    args.output = searchOutputPrefix + topicReader;
-    args.topicReader = topicReader;
-    args.topics = new String[]{topicFile};
-    args.zkUrl = "localhost"; // SearchSolr initialization workaround
-
-    return args;
-  }
-
-  protected static class StubSolrClientFactory extends BasePooledObjectFactory<SolrClient> {
-    final SolrClient client;
-
-    public StubSolrClientFactory(SolrClient client) {
-      this.client = client;
-    }
-
-    @Override
-    public SolrClient create() {
-      return this.client;
-    }
-
-    @Override
-    public PooledObject<SolrClient> wrap(SolrClient solrClient) {
-      return new DefaultPooledObject<>(solrClient);
-    }
-  }
-
-  protected IndexCollection getIndexRunner(IndexArgs args) throws Exception {
-    IndexCollection runner = new IndexCollection(args);
-    Field f = runner.getClass().getDeclaredField("solrPool");
-    f.setAccessible(true);
-    f.set(runner, stubSolrPool);
-    return runner;
-  }
-
-  protected SearchSolr getSearchRunner(SearchSolr.Args args) throws Exception {
-    SearchSolr runner = new SearchSolr(args);
-    Field f = runner.getClass().getDeclaredField("client");
-    f.setAccessible(true);
-    ((SolrClient) f.get(runner)).close(); // close the old client
-    f.set(runner, client);
-    return runner;
-  }
-
-  protected abstract String getCollectionName();
-
-  protected abstract String getSchemaAdjustmentFile();
-
-  protected abstract IndexArgs getIndexArgs();
-
-  protected abstract SearchSolr.Args getSearchArgs();
-
-  protected abstract String[] getRefRankingResult();
-
-  @Test
-  public void testIndexAndSearch() throws Exception {
-    String schemaAdjustmentFile = getSchemaAdjustmentFile();
-    if (schemaAdjustmentFile != null) {
-      // update schema, much like curl -X POST -H 'Content-type:application/json' --data-binary SCHEMA_NAME.json http://localhost:8983/solr/COLLECTION_NAME/schema
-      String schemaJson = Files.readString(getFile(schemaAdjustmentFile).toPath());
-      ModifiableSolrParams params = new ModifiableSolrParams();
-      params.add(CommonParams.QT, "/schema");
-      DirectJsonQueryRequest schemaRequest = new DirectJsonQueryRequest(schemaJson, params);
-      QueryResponse response = schemaRequest.process(client, getCollectionName());
-      assertEquals(0, response.getStatus());
-    }
-
-    IndexArgs indexArgs = getIndexArgs();
-    IndexCollection indexRunner = getIndexRunner(indexArgs);
-    indexRunner.run();
-
-    SearchSolr.Args searchArgs = getSearchArgs();
-    SearchSolr searchRunner = getSearchRunner(searchArgs);
-    searchRunner.runTopics();
-
-    BufferedReader br = new BufferedReader(new FileReader(searchArgs.output));
-    String[] ref = getRefRankingResult();
-    String s;
-    int cnt = 0;
-    while ((s = br.readLine()) != null) {
-      assertEquals(ref[cnt], s);
-      cnt++;
-    }
-    assertEquals(cnt, ref.length);
-    FileUtils.deleteQuietly(new File(searchArgs.output));
-  }
-}
diff --git a/src/test/java/io/anserini/integration/solr/TrecEndToEndTest.java b/src/test/java/io/anserini/integration/solr/TrecEndToEndTest.java
deleted file mode 100644
index f9d95a9d29..0000000000
--- a/src/test/java/io/anserini/integration/solr/TrecEndToEndTest.java
+++ /dev/null
@@ -1,55 +0,0 @@
-/*
- * Anserini: A Lucene toolkit for reproducible information retrieval research
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *   http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package io.anserini.integration.solr;
-
-import io.anserini.collection.TrecCollection;
-import io.anserini.index.IndexArgs;
-import io.anserini.search.SearchSolr;
-
-public class TrecEndToEndTest extends SolrEndToEndTest {
-  @Override
-  protected String getCollectionName() {
-    return "Trec";
-  }
-
-  @Override
-  protected String getSchemaAdjustmentFile() {
-    return null; // no need to adjust schema
-  }
-
-  @Override
-  protected IndexArgs getIndexArgs() {
-    IndexArgs indexArgs = createDefaultIndexArgs();
-    indexArgs.input = "src/test/resources/sample_docs/trec/collection2";
-    indexArgs.collectionClass = TrecCollection.class.getSimpleName();
-    return indexArgs;
-  }
-
-  @Override
-  protected SearchSolr.Args getSearchArgs() {
-    return createSearchArgs("Trec", "src/test/resources/sample_topics/Trec");
-  }
-
-  @Override
-  protected String[] getRefRankingResult() {
-    return new String[]{ // bm25
-        "1 Q0 DOC222 1 0.343200 Solrini",
-        "1 Q0 TREC_DOC_1 2 0.333400 Solrini",
-        "1 Q0 WSJ_1 3 0.068700 Solrini"
-    };
-  }
-}

From dedfbbbaa8c40d284fb02cec7319d833730b2ad1 Mon Sep 17 00:00:00 2001
From: lintool
Date: Mon, 1 Aug 2022 07:44:14 -0400
Subject: [PATCH 10/13] Reordered.

---
 pom.xml | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/pom.xml b/pom.xml
index f0eae16e99..50cb6a995c 100644
--- a/pom.xml
+++ b/pom.xml
@@ -2,7 +2,7 @@
   <modelVersion>4.0.0</modelVersion>
   <groupId>io.anserini</groupId>
   <artifactId>anserini</artifactId>
-  <version>0.14.5-SNAPSHOT</version>
+  <version>0.15.0-SNAPSHOT</version>
   <name>Anserini</name>
   <description>An information retrieval toolkit built on Lucene</description>
   <url>http://anserini.io/</url>
@@ -289,27 +289,27 @@
     </dependency>
     <dependency>
       <groupId>org.apache.lucene</groupId>
-      <artifactId>lucene-queries</artifactId>
+      <artifactId>lucene-codecs</artifactId>
       <version>${lucene.version}</version>
     </dependency>
     <dependency>
       <groupId>org.apache.lucene</groupId>
-      <artifactId>lucene-queryparser</artifactId>
+      <artifactId>lucene-queries</artifactId>
       <version>${lucene.version}</version>
     </dependency>
     <dependency>
      <groupId>org.apache.lucene</groupId>
-      <artifactId>lucene-analysis-common</artifactId>
+      <artifactId>lucene-queryparser</artifactId>
       <version>${lucene.version}</version>
     </dependency>
     <dependency>
       <groupId>org.apache.lucene</groupId>
-      <artifactId>lucene-analysis-kuromoji</artifactId>
+      <artifactId>lucene-analysis-common</artifactId>
       <version>${lucene.version}</version>
     </dependency>
     <dependency>
       <groupId>org.apache.lucene</groupId>
-      <artifactId>lucene-codecs</artifactId>
+      <artifactId>lucene-analysis-kuromoji</artifactId>
       <version>${lucene.version}</version>
     </dependency>

From 3dd6c3498d0e8b73107acd0f990ff636a9da4e91 Mon Sep 17 00:00:00 2001
From: lintool
Date: Mon, 1 Aug 2022 08:23:07 -0400
Subject: [PATCH 11/13] Bumped up to Lucene 9.
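Lucene 9 relocated its test framework into the org.apache.lucene.tests namespace (shipped as the lucene-test-framework artifact), so the changes below are almost entirely import rewrites. The mechanical part of such a migration can be sketched as follows, assuming GNU sed is available; the per-file hunks below remain the authoritative change:

    # Point test-framework imports at the Lucene 9 package layout.
    grep -rl 'org\.apache\.lucene\.util\.LuceneTestCase' src/test \
      | xargs sed -i 's/org\.apache\.lucene\.util\.LuceneTestCase/org.apache.lucene.tests.util.LuceneTestCase/g'
    grep -rl 'org\.apache\.lucene\.util\.TestRuleLimitSysouts' src/test \
      | xargs sed -i 's/org\.apache\.lucene\.util\.TestRuleLimitSysouts/org.apache.lucene.tests.util.TestRuleLimitSysouts/g'

Note that ordinary utility classes such as BytesRef and IOUtils stay in org.apache.lucene.util, which is why the rewrite targets only the test-framework classes by name.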
---
 pom.xml                                               |  2 +-
 src/test/java/io/anserini/GeoIndexerTestBase.java     | 11 ++++++++---
 src/test/java/io/anserini/IndexerTestBase.java        |  2 +-
 .../io/anserini/IndexerWithEmptyDocumentTestBase.java |  2 +-
 .../anserini/collection/DocumentCollectionTest.java   |  2 +-
 .../java/io/anserini/integration/EndToEndTest.java    |  4 ++--
 .../io/anserini/ltr/BaseFeatureExtractorTest.java     |  2 +-
 .../query/DisjunctionMaxQueryGeneratorTest.java       |  2 +-
 .../java/io/anserini/search/query/SdmQueryTest.java   |  2 +-
 src/test/java/io/anserini/util/FeatureVectorTest.java |  2 +-
 10 files changed, 18 insertions(+), 13 deletions(-)

diff --git a/pom.xml b/pom.xml
index 50cb6a995c..e174478da3 100644
--- a/pom.xml
+++ b/pom.xml
@@ -26,7 +26,7 @@
   <properties>
-    <lucene.version>9.0.0</lucene.version>
+    <lucene.version>9.3.0</lucene.version>
     <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
diff --git a/src/test/java/io/anserini/GeoIndexerTestBase.java b/src/test/java/io/anserini/GeoIndexerTestBase.java
index 8c3c94e88d..e3ecc13edf 100644
--- a/src/test/java/io/anserini/GeoIndexerTestBase.java
+++ b/src/test/java/io/anserini/GeoIndexerTestBase.java
@@ -17,7 +17,11 @@
 package io.anserini;
 
 import io.anserini.index.IndexArgs;
-import org.apache.lucene.document.*;
+import org.apache.lucene.document.Document;
+import org.apache.lucene.document.Field;
+import org.apache.lucene.document.LatLonDocValuesField;
+import org.apache.lucene.document.LatLonShape;
+import org.apache.lucene.document.StringField;
 import org.apache.lucene.geo.Line;
 import org.apache.lucene.geo.Polygon;
 import org.apache.lucene.geo.SimpleWKTShapeParser;
@@ -25,9 +29,10 @@
 import org.apache.lucene.index.IndexWriterConfig;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.FSDirectory;
-import org.apache.lucene.util.LuceneTestCase;
-import org.junit.Before;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.After;
+import org.junit.Before;
+
 import java.io.IOException;
 import java.nio.file.Files;
 import java.nio.file.Path;
diff --git a/src/test/java/io/anserini/IndexerTestBase.java b/src/test/java/io/anserini/IndexerTestBase.java
index ffd16c0b0c..8a1410bdc6 100644
--- a/src/test/java/io/anserini/IndexerTestBase.java
+++ b/src/test/java/io/anserini/IndexerTestBase.java
@@ -30,7 +30,7 @@
 import org.apache.lucene.index.IndexWriterConfig;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.FSDirectory;
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.apache.lucene.util.BytesRef;
 import org.junit.After;
 import org.junit.Before;
diff --git a/src/test/java/io/anserini/IndexerWithEmptyDocumentTestBase.java b/src/test/java/io/anserini/IndexerWithEmptyDocumentTestBase.java
index 417a0fb0ea..e4a854d2ca 100644
--- a/src/test/java/io/anserini/IndexerWithEmptyDocumentTestBase.java
+++ b/src/test/java/io/anserini/IndexerWithEmptyDocumentTestBase.java
@@ -30,7 +30,7 @@
 import org.apache.lucene.index.IndexWriterConfig;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.FSDirectory;
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.apache.lucene.util.BytesRef;
 import org.junit.After;
 import org.junit.Before;
diff --git a/src/test/java/io/anserini/collection/DocumentCollectionTest.java b/src/test/java/io/anserini/collection/DocumentCollectionTest.java
index 64b2faee63..ce06003621 100644
--- a/src/test/java/io/anserini/collection/DocumentCollectionTest.java
+++ b/src/test/java/io/anserini/collection/DocumentCollectionTest.java
@@ -16,7 +16,7 @@
 
 package io.anserini.collection;
 
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.After;
 import org.junit.Before;
 import org.junit.Test;
diff --git a/src/test/java/io/anserini/integration/EndToEndTest.java b/src/test/java/io/anserini/integration/EndToEndTest.java
index 3b509702e3..d0a55efe03 100644
--- a/src/test/java/io/anserini/integration/EndToEndTest.java
+++ b/src/test/java/io/anserini/integration/EndToEndTest.java
@@ -28,8 +28,8 @@
 import org.apache.lucene.index.IndexReader;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.FSDirectory;
-import org.apache.lucene.util.LuceneTestCase;
-import org.apache.lucene.util.TestRuleLimitSysouts;
+import org.apache.lucene.tests.util.LuceneTestCase;
+import org.apache.lucene.tests.util.TestRuleLimitSysouts;
 import org.apache.lucene.util.IOUtils;
 import org.junit.After;
 import org.junit.Before;
diff --git a/src/test/java/io/anserini/ltr/BaseFeatureExtractorTest.java b/src/test/java/io/anserini/ltr/BaseFeatureExtractorTest.java
index b93cd5b42b..bfbe194a68 100644
--- a/src/test/java/io/anserini/ltr/BaseFeatureExtractorTest.java
+++ b/src/test/java/io/anserini/ltr/BaseFeatureExtractorTest.java
@@ -31,7 +31,7 @@
 import org.apache.lucene.index.IndexWriterConfig;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.FSDirectory;
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.After;
 import org.junit.Before;
diff --git a/src/test/java/io/anserini/search/query/DisjunctionMaxQueryGeneratorTest.java b/src/test/java/io/anserini/search/query/DisjunctionMaxQueryGeneratorTest.java
index 6b82cdcc29..00ce6a20a0 100644
--- a/src/test/java/io/anserini/search/query/DisjunctionMaxQueryGeneratorTest.java
+++ b/src/test/java/io/anserini/search/query/DisjunctionMaxQueryGeneratorTest.java
@@ -21,7 +21,7 @@
 import org.apache.lucene.search.BoostQuery;
 import org.apache.lucene.search.DisjunctionMaxQuery;
 import org.apache.lucene.search.Query;
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.Test;
 
 import java.util.Map;
diff --git a/src/test/java/io/anserini/search/query/SdmQueryTest.java b/src/test/java/io/anserini/search/query/SdmQueryTest.java
index 89663ffdca..c032882834 100644
--- a/src/test/java/io/anserini/search/query/SdmQueryTest.java
+++ b/src/test/java/io/anserini/search/query/SdmQueryTest.java
@@ -36,7 +36,7 @@
 import org.apache.lucene.search.similarities.BM25Similarity;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.FSDirectory;
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.After;
 import org.junit.Before;
 import org.junit.Test;
diff --git a/src/test/java/io/anserini/util/FeatureVectorTest.java b/src/test/java/io/anserini/util/FeatureVectorTest.java
index c747194004..12694bd90b 100644
--- a/src/test/java/io/anserini/util/FeatureVectorTest.java
+++ b/src/test/java/io/anserini/util/FeatureVectorTest.java
@@ -16,7 +16,7 @@
 
 package io.anserini.util;
 
-import org.apache.lucene.util.LuceneTestCase;
+import org.apache.lucene.tests.util.LuceneTestCase;
 import org.junit.Test;
 
 import java.util.Arrays;

From c3f0ba292dcbb33e64314dc399fb49339c33fb71 Mon Sep 17 00:00:00 2001
From: lintool
Date: Mon, 1 Aug 2022 09:03:51 -0400
Subject: [PATCH 12/13] Added backward codecs.
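For context: lucene-backward-codecs is the module that lets a Lucene 9 runtime open indexes written by the previous major version, which is what the Lucene 8 compatibility fix in the next patch relies on. One way to confirm the dependency actually resolves after this change, using standard Maven from the repo root:

    mvn dependency:tree -Dincludes=org.apache.lucene:lucene-backward-codecs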
---
 pom.xml | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/pom.xml b/pom.xml
index e174478da3..ecb15d4b84 100644
--- a/pom.xml
+++ b/pom.xml
@@ -292,6 +292,11 @@
       <artifactId>lucene-codecs</artifactId>
       <version>${lucene.version}</version>
     </dependency>
+    <dependency>
+      <groupId>org.apache.lucene</groupId>
+      <artifactId>lucene-backward-codecs</artifactId>
+      <version>${lucene.version}</version>
+    </dependency>
     <dependency>
       <groupId>org.apache.lucene</groupId>
       <artifactId>lucene-queries</artifactId>

From be33a261be61b9f29259d4105a133dfd10492dd3 Mon Sep 17 00:00:00 2001
From: lintool
Date: Mon, 1 Aug 2022 09:39:56 -0400
Subject: [PATCH 13/13] Fix Lucene 8/9 index compat issue

---
 src/main/java/io/anserini/search/SearchArgs.java |  3 +++
 .../io/anserini/search/SearchCollection.java     |  6 ++++++
 src/main/python/run_regression.py                | 16 ++++++++++++++--
 3 files changed, 23 insertions(+), 2 deletions(-)

diff --git a/src/main/java/io/anserini/search/SearchArgs.java b/src/main/java/io/anserini/search/SearchArgs.java
index b90dda1a06..d4d3f50d58 100644
--- a/src/main/java/io/anserini/search/SearchArgs.java
+++ b/src/main/java/io/anserini/search/SearchArgs.java
@@ -36,6 +36,9 @@ public class SearchArgs {
   @Option(name = "-topicreader", required = true, usage = "TopicReader to use.")
   public String topicReader;
 
+  @Option(name = "-lucene8", usage = "Enable Lucene 8 index compatibility.")
+  public Boolean lucene8 = false;
+
   // optional arguments
   @Option(name = "-querygenerator", usage = "QueryGenerator to use.")
   public String queryGenerator = "BagOfWordsQueryGenerator";
diff --git a/src/main/java/io/anserini/search/SearchCollection.java b/src/main/java/io/anserini/search/SearchCollection.java
index 1a7d1776ff..ed40f11217 100644
--- a/src/main/java/io/anserini/search/SearchCollection.java
+++ b/src/main/java/io/anserini/search/SearchCollection.java
@@ -494,6 +494,12 @@ public SearchCollection(SearchArgs args) throws IOException {
       loadQrels(args.rf_qrels);
     }
 
+    // See https://github.com/castorini/anserini/issues/1952
+    // The solution to the issue described above is to turn off deterministic tie-breaking.
+    if (args.lucene8) {
+      args.arbitraryScoreTieBreak = true;
+      args.axiom_deterministic = false;
+    }
   }
 
   @Override
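With the flag wired through SearchArgs and the constructor above, retrieval over a Lucene 8 index can relax deterministic tie-breaking from the command line. A hedged invocation sketch (index path, topics file, and output name are illustrative; -bm25 stands in for whichever ranking flags a run actually uses):

    target/appassembler/bin/SearchCollection \
      -index indexes/lucene8-index.robust04 \
      -topicreader Trec -topics src/main/resources/topics-and-qrels/topics.robust04.txt \
      -output run.robust04.bm25.txt -bm25 -lucene8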
diff --git a/src/main/python/run_regression.py b/src/main/python/run_regression.py
index 9afc28d1b9..08884abeeb 100644
--- a/src/main/python/run_regression.py
+++ b/src/main/python/run_regression.py
@@ -61,6 +61,10 @@ def is_close(a, b, rel_tol=1e-09, abs_tol=0.0):
     return abs(a-b) <= max(rel_tol * max(abs(a), abs(b)), abs_tol)
 
 
+def is_close_lucene8(a, b):
+    return abs(a-b) <= 0.001
+
+
 def check_output(command):
     # Python 2.6 compatible subprocess.check_output
     process = Popen(command, shell=True, stdout=PIPE)
@@ -131,6 +135,7 @@ def construct_search_commands(yaml_data):
                '-topicreader', topic_set['topic_reader'] if 'topic_reader' in topic_set and topic_set['topic_reader'] else yaml_data['topic_reader'],
                '-output', construct_runfile_path(yaml_data['corpus'], topic_set['id'], model['name']),
                model['params'],
+               '-lucene8' if args.lucene8 else ''
            ]
        for (model, topic_set) in list(itertools.product(yaml_data['models'], yaml_data['topics']))
     ]
@@ -154,6 +159,7 @@ def construct_convert_commands(yaml_data):
 def evaluate_and_verify(yaml_data, dry_run):
     fail_str = '\033[91m[FAIL]\033[0m '
     ok_str = '   [OK] '
+    okish_str = '  \033[94m[OK*]\033[0m '
     failures = False
 
     logger.info('='*10 + ' Verifying Results: ' + yaml_data['corpus'] + ' ' + '='*10)
@@ -181,8 +187,11 @@ def evaluate_and_verify(yaml_data, dry_run):
                     if is_close(expected, actual):
                         logger.info(ok_str + result_str)
                     else:
-                        logger.error(fail_str + result_str)
-                        failures = True
+                        if args.lucene8 and is_close_lucene8(expected, actual):
+                            logger.info(okish_str + result_str)
+                        else:
+                            logger.error(fail_str + result_str)
+                            failures = True
 
     if not dry_run:
         if failures:
@@ -280,6 +289,7 @@ def download_url(url, save_dir, local_filename=None, md5=None, force=False, verb
                         help='Number of converting runs to execute in parallel.')
     parser.add_argument('--dry-run', dest='dry_run', action='store_true',
                         help='Output commands without actual execution.')
+    parser.add_argument('--lucene8', dest='lucene8', action='store_true', help='Enable Lucene 8 index compatibility.')
 
     args = parser.parse_args()
 
     with open('src/main/resources/regression/{}.yaml'.format(args.regression)) as f:
@@ -340,6 +350,8 @@ def download_url(url, save_dir, local_filename=None, md5=None, force=False, verb
     # Search and verify results.
     if args.search:
         logger.info('='*10 + ' Ranking ' + '='*10)
+        if args.lucene8:
+            logger.info('Enabling Lucene 8 index compatibility.')
         search_cmds = construct_search_commands(yaml_data)
         if args.dry_run:
             for cmd in search_cmds: