/* * Licensed to Elasticsearch under one or more contributor * license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright * ownership. Elasticsearch licenses this file to you under * the Apache License, Version 2.0 (the "License"); you may * not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. */ package org.elasticsearch.index.query; import org.apache.lucene.search.FuzzyQuery; import org.apache.lucene.search.Query; import org.elasticsearch.common.ParseField; import org.elasticsearch.common.ParsingException; import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.lucene.search.Queries; import org.elasticsearch.common.unit.Fuzziness; import org.elasticsearch.common.xcontent.XContentBuilder; import org.elasticsearch.common.xcontent.XContentParser; import org.elasticsearch.index.query.support.QueryParsers; import org.elasticsearch.index.search.MatchQuery; import org.elasticsearch.index.search.MatchQuery.ZeroTermsQuery; import java.io.IOException; import java.util.Locale; import java.util.Objects; /** * Match query is a query that analyzes the text and constructs a query as the * result of the analysis. */ public class MatchQueryBuilder extends AbstractQueryBuilder<MatchQueryBuilder> { public static final ParseField SLOP_FIELD = new ParseField("slop", "phrase_slop").withAllDeprecated("match_phrase query"); public static final ParseField ZERO_TERMS_QUERY_FIELD = new ParseField("zero_terms_query"); public static final ParseField CUTOFF_FREQUENCY_FIELD = new ParseField("cutoff_frequency"); public static final ParseField LENIENT_FIELD = new ParseField("lenient"); public static final ParseField FUZZY_TRANSPOSITIONS_FIELD = new ParseField("fuzzy_transpositions"); public static final ParseField FUZZY_REWRITE_FIELD = new ParseField("fuzzy_rewrite"); public static final ParseField MINIMUM_SHOULD_MATCH_FIELD = new ParseField("minimum_should_match"); public static final ParseField OPERATOR_FIELD = new ParseField("operator"); public static final ParseField MAX_EXPANSIONS_FIELD = new ParseField("max_expansions"); public static final ParseField PREFIX_LENGTH_FIELD = new ParseField("prefix_length"); public static final ParseField ANALYZER_FIELD = new ParseField("analyzer"); public static final ParseField TYPE_FIELD = new ParseField("type").withAllDeprecated("match_phrase and match_phrase_prefix query"); public static final ParseField QUERY_FIELD = new ParseField("query"); /** The name for the match query */ public static final String NAME = "match"; /** The default mode terms are combined in a match query */ public static final Operator DEFAULT_OPERATOR = Operator.OR; /** The default mode match query type */ @Deprecated public static final MatchQuery.Type DEFAULT_TYPE = MatchQuery.Type.BOOLEAN; private final String fieldName; private final Object value; @Deprecated private MatchQuery.Type type = DEFAULT_TYPE; private Operator operator = DEFAULT_OPERATOR; private String analyzer; @Deprecated private int slop = MatchQuery.DEFAULT_PHRASE_SLOP; private Fuzziness fuzziness = null; private int prefixLength = FuzzyQuery.defaultPrefixLength; private int maxExpansions = FuzzyQuery.defaultMaxExpansions; private boolean fuzzyTranspositions = FuzzyQuery.defaultTranspositions; private String minimumShouldMatch; private String fuzzyRewrite = null; private boolean lenient = MatchQuery.DEFAULT_LENIENCY; private MatchQuery.ZeroTermsQuery zeroTermsQuery = MatchQuery.DEFAULT_ZERO_TERMS_QUERY; private Float cutoffFrequency = null; /** * Constructs a new match query. */ public MatchQueryBuilder(String fieldName, Object value) { if (fieldName == null) { throw new IllegalArgumentException("[" + NAME + "] requires fieldName"); } if (value == null) { throw new IllegalArgumentException("[" + NAME + "] requires query value"); } this.fieldName = fieldName; this.value = value; } /** * Read from a stream. */ public MatchQueryBuilder(StreamInput in) throws IOException { super(in); fieldName = in.readString(); value = in.readGenericValue(); type = MatchQuery.Type.readFromStream(in); operator = Operator.readFromStream(in); slop = in.readVInt(); prefixLength = in.readVInt(); maxExpansions = in.readVInt(); fuzzyTranspositions = in.readBoolean(); lenient = in.readBoolean(); zeroTermsQuery = MatchQuery.ZeroTermsQuery.readFromStream(in); // optional fields analyzer = in.readOptionalString(); minimumShouldMatch = in.readOptionalString(); fuzzyRewrite = in.readOptionalString(); fuzziness = in.readOptionalWriteable(Fuzziness::new); cutoffFrequency = in.readOptionalFloat(); } @Override protected void doWriteTo(StreamOutput out) throws IOException { out.writeString(fieldName); out.writeGenericValue(value); type.writeTo(out); operator.writeTo(out); out.writeVInt(slop); out.writeVInt(prefixLength); out.writeVInt(maxExpansions); out.writeBoolean(fuzzyTranspositions); out.writeBoolean(lenient); zeroTermsQuery.writeTo(out); // optional fields out.writeOptionalString(analyzer); out.writeOptionalString(minimumShouldMatch); out.writeOptionalString(fuzzyRewrite); out.writeOptionalWriteable(fuzziness); out.writeOptionalFloat(cutoffFrequency); } /** Returns the field name used in this query. */ public String fieldName() { return this.fieldName; } /** Returns the value used in this query. */ public Object value() { return this.value; } /** * Sets the type of the text query. * * @deprecated Use {@link MatchPhraseQueryBuilder} for <code>phrase</code> * queries and {@link MatchPhrasePrefixQueryBuilder} for * <code>phrase_prefix</code> queries */ @Deprecated public MatchQueryBuilder type(MatchQuery.Type type) { if (type == null) { throw new IllegalArgumentException("[" + NAME + "] requires type to be non-null"); } this.type = type; return this; } /** * Get the type of the query. * * @deprecated Use {@link MatchPhraseQueryBuilder} for <code>phrase</code> * queries and {@link MatchPhrasePrefixQueryBuilder} for * <code>phrase_prefix</code> queries */ @Deprecated public MatchQuery.Type type() { return this.type; } /** Sets the operator to use when using a boolean query. Defaults to <tt>OR</tt>. */ public MatchQueryBuilder operator(Operator operator) { if (operator == null) { throw new IllegalArgumentException("[" + NAME + "] requires operator to be non-null"); } this.operator = operator; return this; } /** Returns the operator to use in a boolean query.*/ public Operator operator() { return this.operator; } /** * Explicitly set the analyzer to use. Defaults to use explicit mapping config for the field, or, if not * set, the default search analyzer. */ public MatchQueryBuilder analyzer(String analyzer) { this.analyzer = analyzer; return this; } /** Get the analyzer to use, if previously set, otherwise <tt>null</tt> */ public String analyzer() { return this.analyzer; } /** * Sets a slop factor for phrase queries * * @deprecated for phrase queries use {@link MatchPhraseQueryBuilder} */ @Deprecated public MatchQueryBuilder slop(int slop) { if (slop < 0 ) { throw new IllegalArgumentException("No negative slop allowed."); } this.slop = slop; return this; } /** * Get the slop factor for phrase queries. * * @deprecated for phrase queries use {@link MatchPhraseQueryBuilder} */ @Deprecated public int slop() { return this.slop; } /** Sets the fuzziness used when evaluated to a fuzzy query type. Defaults to "AUTO". */ public MatchQueryBuilder fuzziness(Object fuzziness) { this.fuzziness = Fuzziness.build(fuzziness); return this; } /** Gets the fuzziness used when evaluated to a fuzzy query type. */ public Fuzziness fuzziness() { return this.fuzziness; } /** * Sets the length of a length of common (non-fuzzy) prefix for fuzzy match queries * @param prefixLength non-negative length of prefix * @throws IllegalArgumentException in case the prefix is negative */ public MatchQueryBuilder prefixLength(int prefixLength) { if (prefixLength < 0 ) { throw new IllegalArgumentException("[" + NAME + "] requires prefix length to be non-negative."); } this.prefixLength = prefixLength; return this; } /** * Gets the length of a length of common (non-fuzzy) prefix for fuzzy match queries */ public int prefixLength() { return this.prefixLength; } /** * When using fuzzy or prefix type query, the number of term expansions to use. */ public MatchQueryBuilder maxExpansions(int maxExpansions) { if (maxExpansions <= 0 ) { throw new IllegalArgumentException("[" + NAME + "] requires maxExpansions to be positive."); } this.maxExpansions = maxExpansions; return this; } /** * Get the (optional) number of term expansions when using fuzzy or prefix type query. */ public int maxExpansions() { return this.maxExpansions; } /** * Set a cutoff value in [0..1] (or absolute number >=1) representing the * maximum threshold of a terms document frequency to be considered a low * frequency term. */ public MatchQueryBuilder cutoffFrequency(float cutoff) { this.cutoffFrequency = cutoff; return this; } /** Gets the optional cutoff value, can be <tt>null</tt> if not set previously */ public Float cutoffFrequency() { return this.cutoffFrequency; } /** Sets optional minimumShouldMatch value to apply to the query */ public MatchQueryBuilder minimumShouldMatch(String minimumShouldMatch) { this.minimumShouldMatch = minimumShouldMatch; return this; } /** Gets the minimumShouldMatch value */ public String minimumShouldMatch() { return this.minimumShouldMatch; } /** Sets the fuzzy_rewrite parameter controlling how the fuzzy query will get rewritten */ public MatchQueryBuilder fuzzyRewrite(String fuzzyRewrite) { this.fuzzyRewrite = fuzzyRewrite; return this; } /** * Get the fuzzy_rewrite parameter * @see #fuzzyRewrite(String) */ public String fuzzyRewrite() { return this.fuzzyRewrite; } /** * Sets whether transpositions are supported in fuzzy queries.<p> * The default metric used by fuzzy queries to determine a match is the Damerau-Levenshtein * distance formula which supports transpositions. Setting transposition to false will * switch to classic Levenshtein distance.<br> * If not set, Damerau-Levenshtein distance metric will be used. */ public MatchQueryBuilder fuzzyTranspositions(boolean fuzzyTranspositions) { this.fuzzyTranspositions = fuzzyTranspositions; return this; } /** Gets the fuzzy query transposition setting. */ public boolean fuzzyTranspositions() { return this.fuzzyTranspositions; } /** * Sets whether format based failures will be ignored. * @deprecated use #lenient() instead */ @Deprecated public MatchQueryBuilder setLenient(boolean lenient) { return lenient(lenient); } /** * Sets whether format based failures will be ignored. */ public MatchQueryBuilder lenient(boolean lenient) { this.lenient = lenient; return this; } /** * Gets leniency setting that controls if format based failures will be ignored. */ public boolean lenient() { return this.lenient; } /** * Sets query to use in case no query terms are available, e.g. after analysis removed them. * Defaults to {@link MatchQuery.ZeroTermsQuery#NONE}, but can be set to * {@link MatchQuery.ZeroTermsQuery#ALL} instead. */ public MatchQueryBuilder zeroTermsQuery(MatchQuery.ZeroTermsQuery zeroTermsQuery) { if (zeroTermsQuery == null) { throw new IllegalArgumentException("[" + NAME + "] requires zeroTermsQuery to be non-null"); } this.zeroTermsQuery = zeroTermsQuery; return this; } /** * Returns the setting for handling zero terms queries. */ public MatchQuery.ZeroTermsQuery zeroTermsQuery() { return this.zeroTermsQuery; } @Override public void doXContent(XContentBuilder builder, Params params) throws IOException { builder.startObject(NAME); builder.startObject(fieldName); builder.field(QUERY_FIELD.getPreferredName(), value); // this is deprecated so only output the value if its not the default value (for bwc) if (type != MatchQuery.Type.BOOLEAN) { builder.field(TYPE_FIELD.getPreferredName(), type.toString().toLowerCase(Locale.ENGLISH)); } builder.field(OPERATOR_FIELD.getPreferredName(), operator.toString()); if (analyzer != null) { builder.field(ANALYZER_FIELD.getPreferredName(), analyzer); } // this is deprecated so only output the value if its not the default value (for bwc) if (slop != MatchQuery.DEFAULT_PHRASE_SLOP) { builder.field(SLOP_FIELD.getPreferredName(), slop); } if (fuzziness != null) { fuzziness.toXContent(builder, params); } builder.field(PREFIX_LENGTH_FIELD.getPreferredName(), prefixLength); builder.field(MAX_EXPANSIONS_FIELD.getPreferredName(), maxExpansions); if (minimumShouldMatch != null) { builder.field(MINIMUM_SHOULD_MATCH_FIELD.getPreferredName(), minimumShouldMatch); } if (fuzzyRewrite != null) { builder.field(FUZZY_REWRITE_FIELD.getPreferredName(), fuzzyRewrite); } // LUCENE 4 UPGRADE we need to document this & test this builder.field(FUZZY_TRANSPOSITIONS_FIELD.getPreferredName(), fuzzyTranspositions); builder.field(LENIENT_FIELD.getPreferredName(), lenient); builder.field(ZERO_TERMS_QUERY_FIELD.getPreferredName(), zeroTermsQuery.toString()); if (cutoffFrequency != null) { builder.field(CUTOFF_FREQUENCY_FIELD.getPreferredName(), cutoffFrequency); } printBoostAndQueryName(builder); builder.endObject(); builder.endObject(); } @Override protected Query doToQuery(QueryShardContext context) throws IOException { // validate context specific fields if (analyzer != null && context.getIndexAnalyzers().get(analyzer) == null) { throw new QueryShardException(context, "[" + NAME + "] analyzer [" + analyzer + "] not found"); } MatchQuery matchQuery = new MatchQuery(context); matchQuery.setOccur(operator.toBooleanClauseOccur()); matchQuery.setAnalyzer(analyzer); matchQuery.setPhraseSlop(slop); matchQuery.setFuzziness(fuzziness); matchQuery.setFuzzyPrefixLength(prefixLength); matchQuery.setMaxExpansions(maxExpansions); matchQuery.setTranspositions(fuzzyTranspositions); matchQuery.setFuzzyRewriteMethod(QueryParsers.parseRewriteMethod(fuzzyRewrite, null)); matchQuery.setLenient(lenient); matchQuery.setCommonTermsCutoff(cutoffFrequency); matchQuery.setZeroTermsQuery(zeroTermsQuery); Query query = matchQuery.parse(type, fieldName, value); return Queries.maybeApplyMinimumShouldMatch(query, minimumShouldMatch); } @Override protected boolean doEquals(MatchQueryBuilder other) { return Objects.equals(fieldName, other.fieldName) && Objects.equals(value, other.value) && Objects.equals(type, other.type) && Objects.equals(operator, other.operator) && Objects.equals(analyzer, other.analyzer) && Objects.equals(slop, other.slop) && Objects.equals(fuzziness, other.fuzziness) && Objects.equals(prefixLength, other.prefixLength) && Objects.equals(maxExpansions, other.maxExpansions) && Objects.equals(minimumShouldMatch, other.minimumShouldMatch) && Objects.equals(fuzzyRewrite, other.fuzzyRewrite) && Objects.equals(lenient, other.lenient) && Objects.equals(fuzzyTranspositions, other.fuzzyTranspositions) && Objects.equals(zeroTermsQuery, other.zeroTermsQuery) && Objects.equals(cutoffFrequency, other.cutoffFrequency); } @Override protected int doHashCode() { return Objects.hash(fieldName, value, type, operator, analyzer, slop, fuzziness, prefixLength, maxExpansions, minimumShouldMatch, fuzzyRewrite, lenient, fuzzyTranspositions, zeroTermsQuery, cutoffFrequency); } @Override public String getWriteableName() { return NAME; } public static MatchQueryBuilder fromXContent(QueryParseContext parseContext) throws IOException { XContentParser parser = parseContext.parser(); String fieldName = null; MatchQuery.Type type = MatchQuery.Type.BOOLEAN; Object value = null; float boost = AbstractQueryBuilder.DEFAULT_BOOST; String minimumShouldMatch = null; String analyzer = null; Operator operator = MatchQueryBuilder.DEFAULT_OPERATOR; int slop = MatchQuery.DEFAULT_PHRASE_SLOP; Fuzziness fuzziness = null; int prefixLength = FuzzyQuery.defaultPrefixLength; int maxExpansion = FuzzyQuery.defaultMaxExpansions; boolean fuzzyTranspositions = FuzzyQuery.defaultTranspositions; String fuzzyRewrite = null; boolean lenient = MatchQuery.DEFAULT_LENIENCY; Float cutOffFrequency = null; ZeroTermsQuery zeroTermsQuery = MatchQuery.DEFAULT_ZERO_TERMS_QUERY; String queryName = null; String currentFieldName = null; XContentParser.Token token; while ((token = parser.nextToken()) != XContentParser.Token.END_OBJECT) { if (token == XContentParser.Token.FIELD_NAME) { currentFieldName = parser.currentName(); } else if (parseContext.isDeprecatedSetting(currentFieldName)) { // skip } else if (token == XContentParser.Token.START_OBJECT) { throwParsingExceptionOnMultipleFields(NAME, parser.getTokenLocation(), fieldName, currentFieldName); fieldName = currentFieldName; while ((token = parser.nextToken()) != XContentParser.Token.END_OBJECT) { if (token == XContentParser.Token.FIELD_NAME) { currentFieldName = parser.currentName(); } else if (token.isValue()) { if (QUERY_FIELD.match(currentFieldName)) { value = parser.objectText(); } else if (TYPE_FIELD.match(currentFieldName)) { String tStr = parser.text(); if ("boolean".equals(tStr)) { type = MatchQuery.Type.BOOLEAN; } else if ("phrase".equals(tStr)) { type = MatchQuery.Type.PHRASE; } else if ("phrase_prefix".equals(tStr) || ("phrasePrefix".equals(tStr))) { type = MatchQuery.Type.PHRASE_PREFIX; } else { throw new ParsingException(parser.getTokenLocation(), "[" + NAME + "] query does not support type " + tStr); } } else if (ANALYZER_FIELD.match(currentFieldName)) { analyzer = parser.text(); } else if (AbstractQueryBuilder.BOOST_FIELD.match(currentFieldName)) { boost = parser.floatValue(); } else if (SLOP_FIELD.match(currentFieldName)) { slop = parser.intValue(); } else if (Fuzziness.FIELD.match(currentFieldName)) { fuzziness = Fuzziness.parse(parser); } else if (PREFIX_LENGTH_FIELD.match(currentFieldName)) { prefixLength = parser.intValue(); } else if (MAX_EXPANSIONS_FIELD.match(currentFieldName)) { maxExpansion = parser.intValue(); } else if (OPERATOR_FIELD.match(currentFieldName)) { operator = Operator.fromString(parser.text()); } else if (MINIMUM_SHOULD_MATCH_FIELD.match(currentFieldName)) { minimumShouldMatch = parser.textOrNull(); } else if (FUZZY_REWRITE_FIELD.match(currentFieldName)) { fuzzyRewrite = parser.textOrNull(); } else if (FUZZY_TRANSPOSITIONS_FIELD.match(currentFieldName)) { fuzzyTranspositions = parser.booleanValue(); } else if (LENIENT_FIELD.match(currentFieldName)) { lenient = parser.booleanValue(); } else if (CUTOFF_FREQUENCY_FIELD.match(currentFieldName)) { cutOffFrequency = parser.floatValue(); } else if (ZERO_TERMS_QUERY_FIELD.match(currentFieldName)) { String zeroTermsDocs = parser.text(); if ("none".equalsIgnoreCase(zeroTermsDocs)) { zeroTermsQuery = MatchQuery.ZeroTermsQuery.NONE; } else if ("all".equalsIgnoreCase(zeroTermsDocs)) { zeroTermsQuery = MatchQuery.ZeroTermsQuery.ALL; } else { throw new ParsingException(parser.getTokenLocation(), "Unsupported zero_terms_docs value [" + zeroTermsDocs + "]"); } } else if (AbstractQueryBuilder.NAME_FIELD.match(currentFieldName)) { queryName = parser.text(); } else { throw new ParsingException(parser.getTokenLocation(), "[" + NAME + "] query does not support [" + currentFieldName + "]"); } } else { throw new ParsingException(parser.getTokenLocation(), "[" + NAME + "] unknown token [" + token + "] after [" + currentFieldName + "]"); } } } else { throwParsingExceptionOnMultipleFields(NAME, parser.getTokenLocation(), fieldName, parser.currentName()); fieldName = parser.currentName(); value = parser.objectText(); } } if (value == null) { throw new ParsingException(parser.getTokenLocation(), "No text specified for text query"); } MatchQueryBuilder matchQuery = new MatchQueryBuilder(fieldName, value); matchQuery.operator(operator); matchQuery.type(type); matchQuery.analyzer(analyzer); matchQuery.slop(slop); matchQuery.minimumShouldMatch(minimumShouldMatch); if (fuzziness != null) { matchQuery.fuzziness(fuzziness); } matchQuery.fuzzyRewrite(fuzzyRewrite); matchQuery.prefixLength(prefixLength); matchQuery.fuzzyTranspositions(fuzzyTranspositions); matchQuery.maxExpansions(maxExpansion); matchQuery.lenient(lenient); if (cutOffFrequency != null) { matchQuery.cutoffFrequency(cutOffFrequency); } matchQuery.zeroTermsQuery(zeroTermsQuery); matchQuery.queryName(queryName); matchQuery.boost(boost); return matchQuery; } }