From 1363a9125a8e3595c3e8f5b29de9e5fe5717fb54 Mon Sep 17 00:00:00 2001 From: Roman Chyla Date: Wed, 20 May 2020 22:09:40 -0400 Subject: [PATCH] Fixed FU guy's feedback --- .../src/test/org/adsabs/TestAdsAllFields.java | 18 ++-- .../server/solr/collection1/conf/schema.xml | 25 +++--- .../solr/collection1/conf/solrconfig.xml | 2 +- scripts/parse_index.py | 90 +++++++++++++++++++ 4 files changed, 113 insertions(+), 22 deletions(-) create mode 100644 scripts/parse_index.py diff --git a/contrib/adsabs/src/test/org/adsabs/TestAdsAllFields.java b/contrib/adsabs/src/test/org/adsabs/TestAdsAllFields.java index fd561b3fe..69e18274e 100644 --- a/contrib/adsabs/src/test/org/adsabs/TestAdsAllFields.java +++ b/contrib/adsabs/src/test/org/adsabs/TestAdsAllFields.java @@ -449,7 +449,7 @@ public void test() throws Exception { "//doc/int[@name='recid'][.='100']", "//doc/float[@name='score'][.='26.0']"); - assert h.query(req("q", "author:\"Einstein, A\"")) + assert h.query(req("q", "author:\"Einstein, A\"", "fl", "author_norm")) .contains("" + "t' Hooft, van X" + "Anders, John Michael" + @@ -570,7 +570,7 @@ public void test() throws Exception { "//*[@numFound='1']"); - assert h.query(req("q", "recid:100")) + assert h.query(req("q", "recid:100", "fl", "aff")) .contains("" + "-" + "NASA Kavli space center, Cambridge, MA 02138, USA" + @@ -646,7 +646,7 @@ public void test() throws Exception { // order/gaps are important - assert h.query(req("q", "recid:100")) + assert h.query(req("q", "recid:100", "fl", "email")) .contains("" + "-" + "anders@email.com" + @@ -667,7 +667,7 @@ public void test() throws Exception { "//doc/int[@name='recid'][.='100']", "//*[@numFound='1']" ); - assert h.query(req("q", "recid:100")) + assert h.query(req("q", "recid:100", "fl", "orcid_pub")) .contains("" + "1111-2222-3333-4444" + "-" + @@ -1293,7 +1293,7 @@ public void test() throws Exception { * links_data (generated and stored as JSON for display purposes) * ids_data (generated and stored as JSON for display purposes) */ - assertQ(req("q", "id:100"), + assertQ(req("q", "id:100", "fl", "links_data"), "//doc/arr[@name='links_data']/str[contains(text(),'MAST')]", "//doc/arr[@name='links_data']/str[contains(text(),'{\"foo\": [\"bar\", \"baz\"], \"one\": {\"two\": \"three\"}}')]" ); @@ -1469,7 +1469,7 @@ public void test() throws Exception { assertQ(req("q", "page_range:23"), "//*[@numFound='0']" // not searchable ); - assertQ(req("q", "page:55"), + assertQ(req("q", "page:55", "fl", "page_range"), "//doc[1]/str[@name='page_range'][.='23-55s']" ); @@ -1540,7 +1540,7 @@ public void test() throws Exception { assertQ(req("q", "data:(nEd OR foo)"), "//doc[1]/int[@name='recid'][.='100']" ); - assertQ(req("q", "data:\"NED:999\""), // numbers should be ignored in search, but stored + assertQ(req("q", "data:\"NED:999\"", "fl", "recid,data"), // numbers should be ignored in search, but stored "//doc[1]/int[@name='recid'][.='100']", "//doc[1]/arr[@name='data']/str[contains(text(),'NED:15')]" ); @@ -1549,7 +1549,7 @@ public void test() throws Exception { * esources * */ - assertQ(req("q", "esources:pub_pDF"), + assertQ(req("q", "esources:pub_pDF", "fl", "recid"), "//doc[1]/int[@name='recid'][.='100']" ); @@ -1626,7 +1626,7 @@ public void test() throws Exception { /* * similar() query */ - assertQ(req("q", "similar(recid:100)"), + assertQ(req("q", "similar(recid:100)", "fl", "recid"), "//doc[1]/int[@name='recid'][.='60']" ); diff --git a/contrib/examples/adsabs/server/solr/collection1/conf/schema.xml b/contrib/examples/adsabs/server/solr/collection1/conf/schema.xml index 2047c8895..98db659dc 100644 --- a/contrib/examples/adsabs/server/solr/collection1/conf/schema.xml +++ b/contrib/examples/adsabs/server/solr/collection1/conf/schema.xml @@ -403,7 +403,7 @@ unittest: TestAdsabsTypeFulltext --> - + @@ -445,6 +445,7 @@ class="org.apache.lucene.analysis.core.SelectiveLowerCaseFilterFactory" /> + - - + + + @@ -551,11 +552,6 @@ inclOrig="true" /> - - + + diff --git a/contrib/examples/adsabs/server/solr/collection1/conf/solrconfig.xml b/contrib/examples/adsabs/server/solr/collection1/conf/solrconfig.xml index 703d8ba35..1a23e126a 100644 --- a/contrib/examples/adsabs/server/solr/collection1/conf/solrconfig.xml +++ b/contrib/examples/adsabs/server/solr/collection1/conf/solrconfig.xml @@ -307,7 +307,7 @@ json 10 - recid author title abstract page pub + id recid author title abstract page pub