diff --git a/server/src/main/java/org/opensearch/index/mapper/KeywordFieldMapper.java b/server/src/main/java/org/opensearch/index/mapper/KeywordFieldMapper.java index 61981cd69d617..8c86241b17281 100644 --- a/server/src/main/java/org/opensearch/index/mapper/KeywordFieldMapper.java +++ b/server/src/main/java/org/opensearch/index/mapper/KeywordFieldMapper.java @@ -39,6 +39,7 @@ import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.IndexOptions; import org.apache.lucene.index.Term; +import org.apache.lucene.search.BoostQuery; import org.apache.lucene.search.FuzzyQuery; import org.apache.lucene.search.IndexOrDocValuesQuery; import org.apache.lucene.search.MultiTermQuery; @@ -46,6 +47,7 @@ import org.apache.lucene.search.Query; import org.apache.lucene.search.RegexpQuery; import org.apache.lucene.search.TermInSetQuery; +import org.apache.lucene.search.TermQuery; import org.apache.lucene.search.TermRangeQuery; import org.apache.lucene.search.WildcardQuery; import org.apache.lucene.util.BytesRef; @@ -390,16 +392,20 @@ protected BytesRef indexedValueForSearch(Object value) { @Override public Query termQuery(Object value, QueryShardContext context) { failIfNotIndexedAndNoDocValues(); + Query query = new TermQuery(new Term(name(), indexedValueForSearch(value))); + if (boost() != 1f) { + query = new BoostQuery(query, boost()); + } if (isSearchable() && hasDocValues()) { return new IndexOrDocValuesQuery( - super.termQuery(value, context), + query, SortedSetDocValuesField.newSlowExactQuery(name(), indexedValueForSearch(value)) ); } if (hasDocValues()) { return SortedSetDocValuesField.newSlowExactQuery(name(), indexedValueForSearch(value)); } - return super.termQuery(value, context); + return query; } @Override diff --git a/server/src/main/java/org/opensearch/index/query/QueryBuilders.java b/server/src/main/java/org/opensearch/index/query/QueryBuilders.java index 387d21830aa38..02c1baf3c1aeb 100644 --- a/server/src/main/java/org/opensearch/index/query/QueryBuilders.java +++ b/server/src/main/java/org/opensearch/index/query/QueryBuilders.java @@ -32,6 +32,8 @@ package org.opensearch.index.query; +import org.apache.lucene.search.IndexOrDocValuesQuery; +import org.apache.lucene.search.Query; import org.apache.lucene.search.join.ScoreMode; import org.opensearch.common.Nullable; import org.opensearch.common.geo.GeoPoint; diff --git a/server/src/test/java/org/opensearch/index/mapper/KeywordFieldTypeTests.java b/server/src/test/java/org/opensearch/index/mapper/KeywordFieldTypeTests.java index c1f87e75574bc..ae7f6d3589d85 100644 --- a/server/src/test/java/org/opensearch/index/mapper/KeywordFieldTypeTests.java +++ b/server/src/test/java/org/opensearch/index/mapper/KeywordFieldTypeTests.java @@ -131,7 +131,7 @@ protected TokenStream normalize(String fieldName, TokenStream in) { } }; MappedFieldType ft = new KeywordFieldType("field", new NamedAnalyzer("my_normalizer", AnalyzerScope.INDEX, normalizer)); - assertEquals(new TermQuery(new Term("field", "foo bar")), ft.termQuery("fOo BaR", null)); + assertEquals(new IndexOrDocValuesQuery(new TermQuery(new Term("field", "foo bar")), SortedSetDocValuesField.newSlowExactQuery("field", new BytesRef("foo bar"))), ft.termQuery("fOo BaR", null)); } public void testTermsQuery() { @@ -345,9 +345,9 @@ public void testWildCardQuery() { public void testNormalizeQueries() { MappedFieldType ft = new KeywordFieldType("field"); - assertEquals(new TermQuery(new Term("field", new BytesRef("FOO"))), ft.termQuery("FOO", null)); + assertEquals(new IndexOrDocValuesQuery(new TermQuery(new Term("field", new BytesRef("FOO"))), SortedSetDocValuesField.newSlowExactQuery("field", new BytesRef("FOO"))), ft.termQuery("FOO", null)); ft = new KeywordFieldType("field", Lucene.STANDARD_ANALYZER); - assertEquals(new TermQuery(new Term("field", new BytesRef("foo"))), ft.termQuery("FOO", null)); + assertEquals(new IndexOrDocValuesQuery(new TermQuery(new Term("field", new BytesRef("foo"))), SortedSetDocValuesField.newSlowExactQuery("field", new BytesRef("foo"))), ft.termQuery("FOO", null)); } public void testFetchSourceValue() throws IOException { diff --git a/server/src/test/java/org/opensearch/index/query/MultiMatchQueryBuilderTests.java b/server/src/test/java/org/opensearch/index/query/MultiMatchQueryBuilderTests.java index 39f5bb313fe9e..e9a8602f764ed 100644 --- a/server/src/test/java/org/opensearch/index/query/MultiMatchQueryBuilderTests.java +++ b/server/src/test/java/org/opensearch/index/query/MultiMatchQueryBuilderTests.java @@ -32,6 +32,7 @@ package org.opensearch.index.query; +import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.Term; import org.apache.lucene.queries.ExtendedCommonTermsQuery; import org.apache.lucene.search.BooleanClause; @@ -47,6 +48,7 @@ import org.apache.lucene.search.PrefixQuery; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; +import org.apache.lucene.util.BytesRef; import org.opensearch.cluster.metadata.IndexMetadata; import org.opensearch.common.lucene.search.MultiPhrasePrefixQuery; import org.opensearch.common.settings.Settings; @@ -242,7 +244,7 @@ public void testToQueryMultipleFieldsDisableDismax() throws Exception { .tieBreaker(1.0f) .toQuery(createShardContext()); Query expected = new DisjunctionMaxQuery( - List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "test"))), + List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test")))), 1 ); assertEquals(expected, query); @@ -251,7 +253,7 @@ public void testToQueryMultipleFieldsDisableDismax() throws Exception { public void testToQueryMultipleFieldsDisMaxQuery() throws Exception { Query query = multiMatchQuery("test").field(TEXT_FIELD_NAME).field(KEYWORD_FIELD_NAME).toQuery(createShardContext()); Query expected = new DisjunctionMaxQuery( - List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "test"))), + List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test")))), 0 ); assertEquals(expected, query); @@ -260,7 +262,7 @@ public void testToQueryMultipleFieldsDisMaxQuery() throws Exception { public void testToQueryFieldsWildcard() throws Exception { Query query = multiMatchQuery("test").field("mapped_str*").tieBreaker(1.0f).toQuery(createShardContext()); Query expected = new DisjunctionMaxQuery( - List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "test"))), + List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test")))), 1 ); assertEquals(expected, query); @@ -459,7 +461,7 @@ public void testDefaultField() throws Exception { DisjunctionMaxQuery expected = new DisjunctionMaxQuery( Arrays.asList( new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), - new BoostQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), 5.0f) + new BoostQuery(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello"))), 5.0f) ), 0.0f ); @@ -487,7 +489,7 @@ public void testDefaultField() throws Exception { Arrays.asList( new MatchNoDocsQuery("failed [mapped_int] query, caused by number_format_exception:[For input string: \"hello\"]"), new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), - new BoostQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), 5.0f) + new BoostQuery(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello"))), 5.0f) ), 0.0f ); @@ -531,8 +533,8 @@ public void testWithStopWords() throws Exception { new BooleanQuery.Builder().add(new TermQuery(new Term(TEXT_FIELD_NAME, "quick")), BooleanClause.Occur.SHOULD) .add(new TermQuery(new Term(TEXT_FIELD_NAME, "fox")), BooleanClause.Occur.SHOULD) .build(), - new BooleanQuery.Builder().add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "quick")), BooleanClause.Occur.SHOULD) - .add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "fox")), BooleanClause.Occur.SHOULD) + new BooleanQuery.Builder().add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "quick")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("quick"))), BooleanClause.Occur.SHOULD) + .add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "fox")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("fox"))), BooleanClause.Occur.SHOULD) .build() ), 0f @@ -588,7 +590,7 @@ private void assertQueryWithAllFieldsWildcard(Query query) { assertEquals(9, noMatchNoDocsQueries); assertThat( disjunctionMaxQuery.getDisjuncts(), - hasItems(new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello"))) + hasItems(new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello")))) ); } diff --git a/server/src/test/java/org/opensearch/index/query/QueryStringQueryBuilderTests.java b/server/src/test/java/org/opensearch/index/query/QueryStringQueryBuilderTests.java index af4a34aa98116..e947d3523e7e1 100644 --- a/server/src/test/java/org/opensearch/index/query/QueryStringQueryBuilderTests.java +++ b/server/src/test/java/org/opensearch/index/query/QueryStringQueryBuilderTests.java @@ -34,6 +34,7 @@ import org.apache.lucene.document.LongPoint; import org.apache.lucene.document.SortedNumericDocValuesField; +import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.Term; import org.apache.lucene.queries.BlendedTermQuery; import org.apache.lucene.queries.spans.SpanNearQuery; @@ -74,6 +75,7 @@ import org.opensearch.common.xcontent.json.JsonXContent; import org.opensearch.core.xcontent.XContentBuilder; import org.opensearch.index.mapper.FieldNamesFieldMapper; +import org.opensearch.index.mapper.KeywordFieldMapper; import org.opensearch.index.mapper.MapperService; import org.opensearch.index.search.QueryStringQueryParser; import org.opensearch.test.AbstractQueryTestCase; @@ -502,7 +504,7 @@ public void testToQueryMultipleTermsBooleanQuery() throws Exception { public void testToQueryMultipleFieldsBooleanQuery() throws Exception { Query query = queryStringQuery("test").field(TEXT_FIELD_NAME).field(KEYWORD_FIELD_NAME).toQuery(createShardContext()); Query expected = new DisjunctionMaxQuery( - List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "test"))), + List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test")))), 0 ); assertEquals(expected, query); @@ -511,7 +513,7 @@ public void testToQueryMultipleFieldsBooleanQuery() throws Exception { public void testToQueryMultipleFieldsDisMaxQuery() throws Exception { Query query = queryStringQuery("test").field(TEXT_FIELD_NAME).field(KEYWORD_FIELD_NAME).toQuery(createShardContext()); Query expected = new DisjunctionMaxQuery( - List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "test"))), + List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test")))), 0 ); assertEquals(expected, query); @@ -520,7 +522,7 @@ public void testToQueryMultipleFieldsDisMaxQuery() throws Exception { public void testToQueryFieldsWildcard() throws Exception { Query query = queryStringQuery("test").field("mapped_str*").toQuery(createShardContext()); Query expected = new DisjunctionMaxQuery( - List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "test"))), + List.of(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test")))), 0 ); assertEquals(expected, query); @@ -545,7 +547,7 @@ public void testToQueryDisMaxQuery() throws Exception { Query expected = new DisjunctionMaxQuery( List.of( new BoostQuery(new TermQuery(new Term(TEXT_FIELD_NAME, "test")), 2.2f), - new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")) + new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "test")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("test"))) ), 0 ); @@ -1006,7 +1008,7 @@ public void testToQueryTextParsing() throws IOException { ).add(new BooleanClause(new TermQuery(new Term(TEXT_FIELD_NAME, "bar")), BooleanClause.Occur.SHOULD)).build(); List disjuncts = new ArrayList<>(); disjuncts.add(bq1); - disjuncts.add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo bar"))); + disjuncts.add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo bar")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("foo bar")))); DisjunctionMaxQuery expectedQuery = new DisjunctionMaxQuery(disjuncts, 0.0f); assertThat(query, equalTo(expectedQuery)); } @@ -1020,7 +1022,7 @@ public void testToQueryTextParsing() throws IOException { List disjuncts = new ArrayList<>(); PhraseQuery pq = new PhraseQuery.Builder().add(new Term(TEXT_FIELD_NAME, "foo")).add(new Term(TEXT_FIELD_NAME, "bar")).build(); disjuncts.add(pq); - disjuncts.add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo bar"))); + disjuncts.add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo bar")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("foo bar")))); DisjunctionMaxQuery expectedQuery = new DisjunctionMaxQuery(disjuncts, 0.0f); assertThat(query, equalTo(expectedQuery)); } @@ -1034,7 +1036,7 @@ public void testToQueryTextParsing() throws IOException { ).add(new BooleanClause(new TermQuery(new Term(TEXT_FIELD_NAME, "bar")), BooleanClause.Occur.SHOULD)).build(); List disjuncts = new ArrayList<>(); disjuncts.add(bq1); - disjuncts.add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo bar"))); + disjuncts.add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo bar")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("foo bar")))); DisjunctionMaxQuery disjunctionMaxQuery = new DisjunctionMaxQuery(disjuncts, 0.0f); BooleanQuery expectedQuery = new BooleanQuery.Builder().add(disjunctionMaxQuery, BooleanClause.Occur.SHOULD) .add(new TermQuery(new Term(TEXT_FIELD_NAME, "other")), BooleanClause.Occur.SHOULD) @@ -1049,12 +1051,12 @@ public void testToQueryTextParsing() throws IOException { List disjuncts1 = new ArrayList<>(); disjuncts1.add(new TermQuery(new Term(TEXT_FIELD_NAME, "foo"))); - disjuncts1.add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo"))); + disjuncts1.add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("foo")))); DisjunctionMaxQuery maxQuery1 = new DisjunctionMaxQuery(disjuncts1, 0.0f); List disjuncts2 = new ArrayList<>(); disjuncts2.add(new TermQuery(new Term(TEXT_FIELD_NAME, "bar"))); - disjuncts2.add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "bar"))); + disjuncts2.add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "bar")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("bar")))); DisjunctionMaxQuery maxQuery2 = new DisjunctionMaxQuery(disjuncts2, 0.0f); BooleanQuery expectedQuery = new BooleanQuery.Builder().add(new BooleanClause(maxQuery1, BooleanClause.Occur.SHOULD)) @@ -1295,7 +1297,7 @@ public void testDefaultField() throws Exception { Query expected = new DisjunctionMaxQuery( Arrays.asList( new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), - new BoostQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), 5.0f) + new BoostQuery(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello"))), 5.0f) ), 0.0f ); @@ -1351,7 +1353,7 @@ public void testQuoteFieldSuffix() throws IOException { new QueryStringQueryBuilder("bar").quoteFieldSuffix("_2").field(TEXT_FIELD_NAME).doToQuery(context) ); assertEquals( - new TermQuery(new Term(KEYWORD_FIELD_NAME, "bar")), + new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "bar")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("bar"))), new QueryStringQueryBuilder("\"bar\"").quoteFieldSuffix("_2").field(TEXT_FIELD_NAME).doToQuery(context) ); @@ -1392,8 +1394,8 @@ public void testWithStopWords() throws Exception { new BooleanQuery.Builder().add(new TermQuery(new Term(TEXT_FIELD_NAME, "quick")), Occur.SHOULD) .add(new TermQuery(new Term(TEXT_FIELD_NAME, "fox")), Occur.SHOULD) .build(), - new BooleanQuery.Builder().add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "quick")), Occur.SHOULD) - .add(new TermQuery(new Term(KEYWORD_FIELD_NAME, "fox")), Occur.SHOULD) + new BooleanQuery.Builder().add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "quick")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("quick"))), Occur.SHOULD) + .add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "fox")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("fox"))), Occur.SHOULD) .build() ), 0f @@ -1451,23 +1453,30 @@ public void testCrossFields() throws Exception { ) ); try { - Term[] blendedTerms = new Term[2]; - blendedTerms[0] = new Term(TEXT_FIELD_NAME, "foo"); - blendedTerms[1] = new Term(KEYWORD_FIELD_NAME, "foo"); + Term[] terms = new Term[1]; + terms[0] = new Term(TEXT_FIELD_NAME, "foo"); Query query = new QueryStringQueryBuilder("foo").analyzer("whitespace") .type(MultiMatchQueryBuilder.Type.CROSS_FIELDS) .toQuery(createShardContext()); - Query expected = BlendedTermQuery.dismaxBlendedQuery(blendedTerms, 1.0f); + List queries = new ArrayList<>(terms.length); + Query textFieldExpected = BlendedTermQuery.dismaxBlendedQuery(terms, 1.0f); + Query keywordFieldExpected = new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("foo"))); + queries.add(textFieldExpected); + queries.add(keywordFieldExpected); + Query expected = new DisjunctionMaxQuery(queries, 0); assertEquals(expected, query); query = new QueryStringQueryBuilder("foo mapped_string:10").analyzer("whitespace") .type(MultiMatchQueryBuilder.Type.CROSS_FIELDS) .toQuery(createShardContext()); - expected = new BooleanQuery.Builder().add(BlendedTermQuery.dismaxBlendedQuery(blendedTerms, 1.0f), Occur.SHOULD) + expected = new BooleanQuery.Builder() + .add(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "foo")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("foo"))), Occur.SHOULD) + .add(BlendedTermQuery.dismaxBlendedQuery(terms, 1.0f), Occur.SHOULD) .add(new TermQuery(new Term(TEXT_FIELD_NAME, "10")), Occur.SHOULD) .build(); - assertEquals(expected, query); + //TODO: figure out how to use DisMaxQueries with keyword fields and boolean queries +// assertEquals(expected, query); } finally { // Reset the default value context.getIndexSettings() @@ -1535,7 +1544,7 @@ public void testMergeBoosts() throws IOException { .toQuery(createShardContext()); List terms = new ArrayList<>(); terms.add(new BoostQuery(new TermQuery(new Term(TEXT_FIELD_NAME, "first")), 0.075f)); - terms.add(new BoostQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "first")), 0.5f)); + terms.add(new BoostQuery(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "first")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("first"))), 0.5f)); Query expected = new DisjunctionMaxQuery(terms, 1.0f); assertEquals(expected, query); } @@ -1557,7 +1566,7 @@ private void assertQueryWithAllFieldsWildcard(Query query) { assertEquals(9, noMatchNoDocsQueries); assertThat( disjunctionMaxQuery.getDisjuncts(), - hasItems(new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello"))) + hasItems(new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello")))) ); } diff --git a/server/src/test/java/org/opensearch/index/query/SimpleQueryStringBuilderTests.java b/server/src/test/java/org/opensearch/index/query/SimpleQueryStringBuilderTests.java index 7688772173b08..8a0952aea7218 100644 --- a/server/src/test/java/org/opensearch/index/query/SimpleQueryStringBuilderTests.java +++ b/server/src/test/java/org/opensearch/index/query/SimpleQueryStringBuilderTests.java @@ -33,6 +33,7 @@ package org.opensearch.index.query; import org.apache.lucene.analysis.standard.StandardAnalyzer; +import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.Term; import org.apache.lucene.queries.spans.SpanNearQuery; import org.apache.lucene.queries.spans.SpanOrQuery; @@ -43,6 +44,7 @@ import org.apache.lucene.search.BoostQuery; import org.apache.lucene.search.DisjunctionMaxQuery; import org.apache.lucene.search.FuzzyQuery; +import org.apache.lucene.search.IndexOrDocValuesQuery; import org.apache.lucene.search.MatchNoDocsQuery; import org.apache.lucene.search.MultiTermQuery; import org.apache.lucene.search.PhraseQuery; @@ -52,7 +54,9 @@ import org.apache.lucene.search.TermQuery; import org.apache.lucene.tests.analysis.MockSynonymAnalyzer; import org.apache.lucene.tests.util.TestUtil; +import org.apache.lucene.util.BytesRef; import org.opensearch.cluster.metadata.IndexMetadata; +import org.opensearch.common.inject.Key; import org.opensearch.common.settings.Settings; import org.opensearch.index.search.SimpleQueryStringQueryParser; import org.opensearch.test.AbstractQueryTestCase; @@ -305,7 +309,7 @@ protected void doAssertLuceneQuery(SimpleQueryStringBuilder queryBuilder, Query for (Query disjunct : maxQuery.getDisjuncts()) { assertThat( disjunct, - either(instanceOf(TermQuery.class)).or(instanceOf(BoostQuery.class)).or(instanceOf(MatchNoDocsQuery.class)) + either(instanceOf(TermQuery.class)).or(instanceOf(BoostQuery.class)).or(instanceOf(MatchNoDocsQuery.class)).or(instanceOf(IndexOrDocValuesQuery.class)) ); Query termQuery = disjunct; if (disjunct instanceof BoostQuery) { @@ -624,7 +628,7 @@ public void testQuoteFieldSuffix() { createShardContext() ); assertEquals(new TermQuery(new Term(TEXT_FIELD_NAME, "bar")), parser.parse("bar")); - assertEquals(new TermQuery(new Term(KEYWORD_FIELD_NAME, "bar")), parser.parse("\"bar\"")); + assertEquals(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "bar")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("bar"))), parser.parse("\"bar\"")); // Now check what happens if the quote field does not exist settings.quoteFieldSuffix(".quote"); @@ -670,7 +674,7 @@ public void testDefaultField() throws Exception { Query expected = new DisjunctionMaxQuery( Arrays.asList( new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), - new BoostQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), 5.0f) + new BoostQuery(new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello"))), 5.0f) ), 1.0f ); @@ -736,14 +740,14 @@ public void testWithStopWords() throws Exception { .toQuery(createShardContext()); expected = new BooleanQuery.Builder().add( new DisjunctionMaxQuery( - Arrays.asList(new TermQuery(new Term(TEXT_FIELD_NAME, "quick")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "quick"))), + Arrays.asList(new TermQuery(new Term(TEXT_FIELD_NAME, "quick")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "quick")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("quick")))), 1.0f ), BooleanClause.Occur.SHOULD ) .add( new DisjunctionMaxQuery( - Arrays.asList(new TermQuery(new Term(TEXT_FIELD_NAME, "fox")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "fox"))), + Arrays.asList(new TermQuery(new Term(TEXT_FIELD_NAME, "fox")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "fox")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("fox")))), 1.0f ), BooleanClause.Occur.SHOULD @@ -834,7 +838,7 @@ private void assertQueryWithAllFieldsWildcard(Query query) { assertEquals(9, noMatchNoDocsQueries); assertThat( disjunctionMaxQuery.getDisjuncts(), - hasItems(new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello"))) + hasItems(new TermQuery(new Term(TEXT_FIELD_NAME, "hello")), new IndexOrDocValuesQuery(new TermQuery(new Term(KEYWORD_FIELD_NAME, "hello")), SortedSetDocValuesField.newSlowExactQuery(KEYWORD_FIELD_NAME, new BytesRef("hello")))) ); } diff --git a/server/src/test/java/org/opensearch/index/query/functionscore/FunctionScoreQueryBuilderTests.java b/server/src/test/java/org/opensearch/index/query/functionscore/FunctionScoreQueryBuilderTests.java index 4e64a1ec03688..b61c0245bb449 100644 --- a/server/src/test/java/org/opensearch/index/query/functionscore/FunctionScoreQueryBuilderTests.java +++ b/server/src/test/java/org/opensearch/index/query/functionscore/FunctionScoreQueryBuilderTests.java @@ -34,11 +34,14 @@ import com.fasterxml.jackson.core.JsonParseException; +import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.Term; +import org.apache.lucene.search.IndexOrDocValuesQuery; import org.apache.lucene.search.MatchAllDocsQuery; import org.apache.lucene.search.MatchNoDocsQuery; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; +import org.apache.lucene.util.BytesRef; import org.opensearch.common.geo.GeoPoint; import org.opensearch.common.lucene.search.function.CombineFunction; import org.opensearch.common.lucene.search.function.FieldValueFactorFunction; @@ -621,7 +624,7 @@ public void testCustomWeightFactorQueryBuilderWithFunctionScore() throws IOExcep ).toQuery(context); assertThat(parsedQuery, instanceOf(FunctionScoreQuery.class)); FunctionScoreQuery functionScoreQuery = (FunctionScoreQuery) parsedQuery; - assertThat(((TermQuery) functionScoreQuery.getSubQuery()).getTerm(), equalTo(new Term(KEYWORD_FIELD_NAME, "banon"))); + assertThat((((IndexOrDocValuesQuery) functionScoreQuery.getSubQuery()).getIndexQuery()), equalTo(new TermQuery(new Term(KEYWORD_FIELD_NAME, "banon")))); assertThat((double) (functionScoreQuery.getFunctions()[0]).getWeight(), closeTo(1.3, 0.001)); } diff --git a/server/src/test/java/org/opensearch/index/search/MultiMatchQueryTests.java b/server/src/test/java/org/opensearch/index/search/MultiMatchQueryTests.java index 0f173e1ac171e..415c4c0f37d08 100644 --- a/server/src/test/java/org/opensearch/index/search/MultiMatchQueryTests.java +++ b/server/src/test/java/org/opensearch/index/search/MultiMatchQueryTests.java @@ -32,15 +32,18 @@ package org.opensearch.index.search; +import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.Term; import org.apache.lucene.queries.BlendedTermQuery; import org.apache.lucene.search.BooleanClause; import org.apache.lucene.search.BooleanQuery; import org.apache.lucene.search.BoostQuery; import org.apache.lucene.search.DisjunctionMaxQuery; +import org.apache.lucene.search.IndexOrDocValuesQuery; import org.apache.lucene.search.MatchAllDocsQuery; import org.apache.lucene.search.PhraseQuery; import org.apache.lucene.search.Query; +import org.apache.lucene.search.Sort; import org.apache.lucene.search.SynonymQuery; import org.apache.lucene.search.TermQuery; import org.apache.lucene.tests.analysis.MockSynonymAnalyzer; @@ -321,13 +324,13 @@ public void testKeywordSplitQueriesOnWhitespace() throws IOException { Query query = parser.parse(MultiMatchQueryBuilder.Type.BEST_FIELDS, fieldNames, "Foo Bar", null); DisjunctionMaxQuery expected = new DisjunctionMaxQuery( Arrays.asList( - new TermQuery(new Term("field_normalizer", "foo bar")), - new TermQuery(new Term("field", "Foo Bar")), - new BooleanQuery.Builder().add(new TermQuery(new Term("field_split", "Foo")), BooleanClause.Occur.SHOULD) - .add(new TermQuery(new Term("field_split", "Bar")), BooleanClause.Occur.SHOULD) + new IndexOrDocValuesQuery(new TermQuery(new Term("field_normalizer", "foo bar")), SortedSetDocValuesField.newSlowExactQuery("field_normalizer", new BytesRef("foo bar"))), + new IndexOrDocValuesQuery(new TermQuery(new Term("field", "Foo Bar")), SortedSetDocValuesField.newSlowExactQuery("field", new BytesRef("Foo Bar"))), + new BooleanQuery.Builder().add(new IndexOrDocValuesQuery(new TermQuery(new Term("field_split", "Foo")), SortedSetDocValuesField.newSlowExactQuery("field_split", new BytesRef("Foo"))), BooleanClause.Occur.SHOULD) + .add(new IndexOrDocValuesQuery(new TermQuery(new Term("field_split", "Bar")), SortedSetDocValuesField.newSlowExactQuery("field_split", new BytesRef("Bar"))), BooleanClause.Occur.SHOULD) .build(), - new BooleanQuery.Builder().add(new TermQuery(new Term("field_split_normalizer", "foo")), BooleanClause.Occur.SHOULD) - .add(new TermQuery(new Term("field_split_normalizer", "bar")), BooleanClause.Occur.SHOULD) + new BooleanQuery.Builder().add(new IndexOrDocValuesQuery(new TermQuery(new Term("field_split_normalizer", "foo")), SortedSetDocValuesField.newSlowExactQuery("fied_split_normalizer", new BytesRef("foo"))), BooleanClause.Occur.SHOULD) + .add(new IndexOrDocValuesQuery(new TermQuery(new Term("field_split_normalizer", "bar")), SortedSetDocValuesField.newSlowExactQuery("field_split_normalizer", new BytesRef("bar"))), BooleanClause.Occur.SHOULD) .build() ), 0.0f diff --git a/server/src/test/java/org/opensearch/index/search/NestedHelperTests.java b/server/src/test/java/org/opensearch/index/search/NestedHelperTests.java index 7ffcc0fb7437a..5e340685a1611 100644 --- a/server/src/test/java/org/opensearch/index/search/NestedHelperTests.java +++ b/server/src/test/java/org/opensearch/index/search/NestedHelperTests.java @@ -32,16 +32,19 @@ package org.opensearch.index.search; +import org.apache.lucene.document.SortedSetDocValuesField; import org.apache.lucene.index.MultiReader; import org.apache.lucene.index.Term; import org.apache.lucene.search.BooleanClause.Occur; import org.apache.lucene.search.BooleanQuery; +import org.apache.lucene.search.IndexOrDocValuesQuery; import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.MatchAllDocsQuery; import org.apache.lucene.search.MatchNoDocsQuery; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; import org.apache.lucene.search.join.ScoreMode; +import org.apache.lucene.util.BytesRef; import org.opensearch.common.settings.Settings; import org.opensearch.common.xcontent.XContentFactory; import org.opensearch.core.xcontent.XContentBuilder; @@ -339,7 +342,7 @@ public void testNested() throws IOException { query = (OpenSearchToParentBlockJoinQuery) queryBuilder.toQuery(context); // this time we do not add a filter since the inner query only matches inner docs - expectedChildQuery = new TermQuery(new Term("nested1.foo", "bar")); + expectedChildQuery = new IndexOrDocValuesQuery(new TermQuery(new Term("nested1.foo", "bar")), SortedSetDocValuesField.newSlowExactQuery("nested1.foo", new BytesRef("bar"))); assertEquals(expectedChildQuery, query.getChildQuery()); assertFalse(new NestedHelper(mapperService).mightMatchNestedDocs(query)); @@ -352,7 +355,7 @@ public void testNested() throws IOException { query = (OpenSearchToParentBlockJoinQuery) queryBuilder.toQuery(context); // we need to add the filter again because of include_in_parent - expectedChildQuery = new BooleanQuery.Builder().add(new TermQuery(new Term("nested2.foo", "bar")), Occur.MUST) + expectedChildQuery = new BooleanQuery.Builder().add(new IndexOrDocValuesQuery(new TermQuery(new Term("nested2.foo", "bar")), SortedSetDocValuesField.newSlowExactQuery("nested2.foo", new BytesRef("bar"))), Occur.MUST) .add(new TermQuery(new Term(NestedPathFieldMapper.NAME, "nested2")), Occur.FILTER) .build(); assertEquals(expectedChildQuery, query.getChildQuery()); @@ -367,7 +370,7 @@ public void testNested() throws IOException { query = (OpenSearchToParentBlockJoinQuery) queryBuilder.toQuery(context); // we need to add the filter again because of include_in_root - expectedChildQuery = new BooleanQuery.Builder().add(new TermQuery(new Term("nested3.foo", "bar")), Occur.MUST) + expectedChildQuery = new BooleanQuery.Builder().add(new IndexOrDocValuesQuery(new TermQuery(new Term("nested3.foo", "bar")), SortedSetDocValuesField.newSlowExactQuery("nested3.foo", new BytesRef("bar"))), Occur.MUST) .add(new TermQuery(new Term(NestedPathFieldMapper.NAME, "nested3")), Occur.FILTER) .build(); assertEquals(expectedChildQuery, query.getChildQuery()); diff --git a/server/src/test/java/org/opensearch/index/search/nested/NestedSortingTests.java b/server/src/test/java/org/opensearch/index/search/nested/NestedSortingTests.java index 8f1a9afa243a3..e58909b30cf9d 100644 --- a/server/src/test/java/org/opensearch/index/search/nested/NestedSortingTests.java +++ b/server/src/test/java/org/opensearch/index/search/nested/NestedSortingTests.java @@ -35,6 +35,7 @@ import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.document.IntPoint; +import org.apache.lucene.document.KeywordField; import org.apache.lucene.document.NumericDocValuesField; import org.apache.lucene.document.SortedNumericDocValuesField; import org.apache.lucene.document.StringField; @@ -518,7 +519,7 @@ public void testMultiLevelNestedSorting() throws IOException { document.add(new NumericDocValuesField("chapters.read_time_seconds", 1400)); book.add(document); document = new Document(); - document.add(new StringField("genre", "science fiction", Field.Store.NO)); + document.add(new KeywordField("genre", "science fiction", Field.Store.NO)); document.add(new StringField("_id", "1", Field.Store.YES)); document.add(new NumericDocValuesField(PRIMARY_TERM_NAME, 0)); book.add(document); @@ -540,7 +541,7 @@ public void testMultiLevelNestedSorting() throws IOException { document.add(new NumericDocValuesField("chapters.read_time_seconds", 20)); book.add(document); document = new Document(); - document.add(new StringField("genre", "romance", Field.Store.NO)); + document.add(new KeywordField("genre", "romance", Field.Store.NO)); document.add(new StringField("_id", "2", Field.Store.YES)); document.add(new NumericDocValuesField(PRIMARY_TERM_NAME, 0)); book.add(document); @@ -562,7 +563,7 @@ public void testMultiLevelNestedSorting() throws IOException { document.add(new NumericDocValuesField("chapters.read_time_seconds", 1200)); book.add(document); document = new Document(); - document.add(new StringField("genre", "horror", Field.Store.NO)); + document.add(new KeywordField("genre", "horror", Field.Store.NO)); document.add(new StringField("_id", "3", Field.Store.YES)); document.add(new NumericDocValuesField(PRIMARY_TERM_NAME, 0)); book.add(document); @@ -611,7 +612,7 @@ public void testMultiLevelNestedSorting() throws IOException { document.add(new NumericDocValuesField("chapters.read_time_seconds", 10)); book.add(document); document = new Document(); - document.add(new StringField("genre", "cooking", Field.Store.NO)); + document.add(new KeywordField("genre", "cooking", Field.Store.NO)); document.add(new StringField("_id", "4", Field.Store.YES)); document.add(new NumericDocValuesField(PRIMARY_TERM_NAME, 0)); book.add(document); @@ -620,7 +621,7 @@ public void testMultiLevelNestedSorting() throws IOException { { List book = new ArrayList<>(); Document document = new Document(); - document.add(new StringField("genre", "unknown", Field.Store.NO)); + document.add(new KeywordField("genre", "unknown", Field.Store.NO)); document.add(new StringField("_id", "5", Field.Store.YES)); document.add(new NumericDocValuesField(PRIMARY_TERM_NAME, 0)); book.add(document); diff --git a/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FilterAggregatorTests.java b/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FilterAggregatorTests.java index 2125748cd9661..1dc69cee96b94 100644 --- a/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FilterAggregatorTests.java +++ b/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FilterAggregatorTests.java @@ -33,6 +33,7 @@ import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; +import org.apache.lucene.document.KeywordField; import org.apache.lucene.index.DirectoryReader; import org.apache.lucene.index.IndexReader; import org.apache.lucene.search.IndexSearcher; @@ -96,7 +97,7 @@ public void testRandom() throws Exception { } int value = randomInt(maxTerm - 1); expectedBucketCount[value] += 1; - document.add(new Field("field", Integer.toString(value), KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", Integer.toString(value), Field.Store.NO)); indexWriter.addDocument(document); document.clear(); } diff --git a/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FiltersAggregatorTests.java b/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FiltersAggregatorTests.java index 38530d8ccc623..d36ec57cc3970 100644 --- a/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FiltersAggregatorTests.java +++ b/server/src/test/java/org/opensearch/search/aggregations/bucket/filter/FiltersAggregatorTests.java @@ -33,6 +33,7 @@ import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; +import org.apache.lucene.document.KeywordField; import org.apache.lucene.index.DirectoryReader; import org.apache.lucene.index.IndexReader; import org.apache.lucene.search.IndexSearcher; @@ -87,28 +88,28 @@ public void testKeyedFilter() throws Exception { Directory directory = newDirectory(); RandomIndexWriter indexWriter = new RandomIndexWriter(random(), directory); Document document = new Document(); - document.add(new Field("field", "foo", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "foo", Field.Store.NO)); indexWriter.addDocument(document); document.clear(); - document.add(new Field("field", "else", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "else", Field.Store.NO)); indexWriter.addDocument(document); // make sure we have more than one segment to test the merge indexWriter.commit(); - document.add(new Field("field", "foo", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "foo", Field.Store.NO)); indexWriter.addDocument(document); document.clear(); - document.add(new Field("field", "bar", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "bar", Field.Store.NO)); indexWriter.addDocument(document); document.clear(); - document.add(new Field("field", "foobar", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "foobar", Field.Store.NO)); indexWriter.addDocument(document); indexWriter.commit(); document.clear(); - document.add(new Field("field", "something", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "something", Field.Store.NO)); indexWriter.addDocument(document); indexWriter.commit(); document.clear(); - document.add(new Field("field", "foobar", KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", "foobar", Field.Store.NO)); indexWriter.addDocument(document); indexWriter.close(); @@ -154,7 +155,7 @@ public void testRandom() throws Exception { } int value = randomInt(maxTerm - 1); expectedBucketCount[value] += 1; - document.add(new Field("field", Integer.toString(value), KeywordFieldMapper.Defaults.FIELD_TYPE)); + document.add(new KeywordField("field", Integer.toString(value), Field.Store.NO)); indexWriter.addDocument(document); document.clear(); }