|
38 | 38 | import org.apache.lucene.document.FieldType;
|
39 | 39 | import org.apache.lucene.document.SortedSetDocValuesField;
|
40 | 40 | import org.apache.lucene.index.IndexOptions;
|
| 41 | +import org.apache.lucene.index.Term; |
| 42 | +import org.apache.lucene.search.FuzzyQuery; |
| 43 | +import org.apache.lucene.search.IndexOrDocValuesQuery; |
41 | 44 | import org.apache.lucene.search.MultiTermQuery;
|
| 45 | +import org.apache.lucene.search.PrefixQuery; |
42 | 46 | import org.apache.lucene.search.Query;
|
| 47 | +import org.apache.lucene.search.RegexpQuery; |
| 48 | +import org.apache.lucene.search.TermInSetQuery; |
| 49 | +import org.apache.lucene.search.TermRangeQuery; |
| 50 | +import org.apache.lucene.search.WildcardQuery; |
43 | 51 | import org.apache.lucene.util.BytesRef;
|
| 52 | +import org.apache.lucene.util.automaton.Operations; |
| 53 | +import org.opensearch.OpenSearchException; |
44 | 54 | import org.opensearch.common.Nullable;
|
| 55 | +import org.opensearch.common.lucene.BytesRefs; |
45 | 56 | import org.opensearch.common.lucene.Lucene;
|
| 57 | +import org.opensearch.common.lucene.search.AutomatonQueries; |
| 58 | +import org.opensearch.common.unit.Fuzziness; |
46 | 59 | import org.opensearch.core.xcontent.XContentParser;
|
47 | 60 | import org.opensearch.index.analysis.IndexAnalyzers;
|
48 | 61 | import org.opensearch.index.analysis.NamedAnalyzer;
|
|
62 | 75 | import java.util.Objects;
|
63 | 76 | import java.util.function.Supplier;
|
64 | 77 |
|
| 78 | +import static org.opensearch.search.SearchService.ALLOW_EXPENSIVE_QUERIES; |
| 79 | + |
65 | 80 | /**
|
66 | 81 | * A field mapper for keywords. This mapper accepts strings and indexes them as-is.
|
67 | 82 | *
|
@@ -317,7 +332,7 @@ public IndexFieldData.Builder fielddataBuilder(String fullyQualifiedIndexName, S
|
317 | 332 | @Override
|
318 | 333 | public ValueFetcher valueFetcher(QueryShardContext context, SearchLookup searchLookup, String format) {
|
319 | 334 | if (format != null) {
|
320 |
| - throw new IllegalArgumentException("Field [" + name() + "] of type [" + typeName() + "] doesn't support formats."); |
| 335 | + throw new IllegalArgumentException("Field [" + name() + "] of type [" + typeName() + "] doesn't " + "support formats."); |
321 | 336 | }
|
322 | 337 |
|
323 | 338 | return new SourceValueFetcher(name(), context, nullValue) {
|
@@ -372,17 +387,226 @@ protected BytesRef indexedValueForSearch(Object value) {
|
372 | 387 | return getTextSearchInfo().getSearchAnalyzer().normalize(name(), value.toString());
|
373 | 388 | }
|
374 | 389 |
|
| 390 | + @Override |
| 391 | + public Query termsQuery(List<?> values, QueryShardContext context) { |
| 392 | + failIfNotIndexedAndNoDocValues(); |
| 393 | + // has index and doc_values enabled |
| 394 | + if (isSearchable() && hasDocValues()) { |
| 395 | + BytesRef[] bytesRefs = new BytesRef[values.size()]; |
| 396 | + for (int i = 0; i < bytesRefs.length; i++) { |
| 397 | + bytesRefs[i] = indexedValueForSearch(values.get(i)); |
| 398 | + } |
| 399 | + Query indexQuery = new TermInSetQuery(name(), bytesRefs); |
| 400 | + Query dvQuery = new TermInSetQuery(MultiTermQuery.DOC_VALUES_REWRITE, name(), bytesRefs); |
| 401 | + return new IndexOrDocValuesQuery(indexQuery, dvQuery); |
| 402 | + } |
| 403 | + // if we only have doc_values enabled, we construct a new query with doc_values re-written |
| 404 | + if (hasDocValues()) { |
| 405 | + BytesRef[] bytesRefs = new BytesRef[values.size()]; |
| 406 | + for (int i = 0; i < bytesRefs.length; i++) { |
| 407 | + bytesRefs[i] = indexedValueForSearch(values.get(i)); |
| 408 | + } |
| 409 | + return new TermInSetQuery(MultiTermQuery.DOC_VALUES_REWRITE, name(), bytesRefs); |
| 410 | + } |
| 411 | + // has index enabled, we're going to return the query as is |
| 412 | + return super.termsQuery(values, context); |
| 413 | + } |
| 414 | + |
| 415 | + @Override |
| 416 | + public Query prefixQuery( |
| 417 | + String value, |
| 418 | + @Nullable MultiTermQuery.RewriteMethod method, |
| 419 | + boolean caseInsensitive, |
| 420 | + QueryShardContext context |
| 421 | + ) { |
| 422 | + if (context.allowExpensiveQueries() == false) { |
| 423 | + throw new OpenSearchException( |
| 424 | + "[prefix] queries cannot be executed when '" |
| 425 | + + ALLOW_EXPENSIVE_QUERIES.getKey() |
| 426 | + + "' is set to false. For optimised prefix queries on text " |
| 427 | + + "fields please enable [index_prefixes]." |
| 428 | + ); |
| 429 | + } |
| 430 | + failIfNotIndexedAndNoDocValues(); |
| 431 | + if (isSearchable() && hasDocValues()) { |
| 432 | + Query indexQuery = super.prefixQuery(value, method, caseInsensitive, context); |
| 433 | + Query dvQuery = super.prefixQuery(value, MultiTermQuery.DOC_VALUES_REWRITE, caseInsensitive, context); |
| 434 | + return new IndexOrDocValuesQuery(indexQuery, dvQuery); |
| 435 | + } |
| 436 | + if (hasDocValues()) { |
| 437 | + if (caseInsensitive) { |
| 438 | + return AutomatonQueries.caseInsensitivePrefixQuery( |
| 439 | + (new Term(name(), indexedValueForSearch(value))), |
| 440 | + MultiTermQuery.DOC_VALUES_REWRITE |
| 441 | + ); |
| 442 | + } |
| 443 | + return new PrefixQuery(new Term(name(), indexedValueForSearch(value)), MultiTermQuery.DOC_VALUES_REWRITE); |
| 444 | + } |
| 445 | + return super.prefixQuery(value, method, caseInsensitive, context); |
| 446 | + } |
| 447 | + |
| 448 | + @Override |
| 449 | + public Query regexpQuery( |
| 450 | + String value, |
| 451 | + int syntaxFlags, |
| 452 | + int matchFlags, |
| 453 | + int maxDeterminizedStates, |
| 454 | + @Nullable MultiTermQuery.RewriteMethod method, |
| 455 | + QueryShardContext context |
| 456 | + ) { |
| 457 | + if (context.allowExpensiveQueries() == false) { |
| 458 | + throw new OpenSearchException( |
| 459 | + "[regexp] queries cannot be executed when '" + ALLOW_EXPENSIVE_QUERIES.getKey() + "' is set to " + "false." |
| 460 | + ); |
| 461 | + } |
| 462 | + failIfNotIndexedAndNoDocValues(); |
| 463 | + if (isSearchable() && hasDocValues()) { |
| 464 | + Query indexQuery = super.regexpQuery(value, syntaxFlags, matchFlags, maxDeterminizedStates, method, context); |
| 465 | + Query dvQuery = super.regexpQuery( |
| 466 | + value, |
| 467 | + syntaxFlags, |
| 468 | + matchFlags, |
| 469 | + maxDeterminizedStates, |
| 470 | + MultiTermQuery.DOC_VALUES_REWRITE, |
| 471 | + context |
| 472 | + ); |
| 473 | + return new IndexOrDocValuesQuery(indexQuery, dvQuery); |
| 474 | + } |
| 475 | + if (hasDocValues()) { |
| 476 | + return new RegexpQuery( |
| 477 | + new Term(name(), indexedValueForSearch(value)), |
| 478 | + syntaxFlags, |
| 479 | + matchFlags, |
| 480 | + RegexpQuery.DEFAULT_PROVIDER, |
| 481 | + maxDeterminizedStates, |
| 482 | + MultiTermQuery.DOC_VALUES_REWRITE |
| 483 | + ); |
| 484 | + } |
| 485 | + return super.regexpQuery(value, syntaxFlags, matchFlags, maxDeterminizedStates, method, context); |
| 486 | + } |
| 487 | + |
| 488 | + @Override |
| 489 | + public Query rangeQuery(Object lowerTerm, Object upperTerm, boolean includeLower, boolean includeUpper, QueryShardContext context) { |
| 490 | + if (context.allowExpensiveQueries() == false) { |
| 491 | + throw new OpenSearchException( |
| 492 | + "[range] queries on [text] or [keyword] fields cannot be executed when '" |
| 493 | + + ALLOW_EXPENSIVE_QUERIES.getKey() |
| 494 | + + "' is set to false." |
| 495 | + ); |
| 496 | + } |
| 497 | + failIfNotIndexedAndNoDocValues(); |
| 498 | + if (isSearchable() && hasDocValues()) { |
| 499 | + Query indexQuery = new TermRangeQuery( |
| 500 | + name(), |
| 501 | + lowerTerm == null ? null : indexedValueForSearch(lowerTerm), |
| 502 | + upperTerm == null ? null : indexedValueForSearch(upperTerm), |
| 503 | + includeLower, |
| 504 | + includeUpper |
| 505 | + ); |
| 506 | + Query dvQuery = new TermRangeQuery( |
| 507 | + name(), |
| 508 | + lowerTerm == null ? null : indexedValueForSearch(lowerTerm), |
| 509 | + upperTerm == null ? null : indexedValueForSearch(upperTerm), |
| 510 | + includeLower, |
| 511 | + includeUpper, |
| 512 | + MultiTermQuery.DOC_VALUES_REWRITE |
| 513 | + ); |
| 514 | + return new IndexOrDocValuesQuery(indexQuery, dvQuery); |
| 515 | + } |
| 516 | + if (hasDocValues()) { |
| 517 | + return new TermRangeQuery( |
| 518 | + name(), |
| 519 | + lowerTerm == null ? null : indexedValueForSearch(lowerTerm), |
| 520 | + upperTerm == null ? null : indexedValueForSearch(upperTerm), |
| 521 | + includeLower, |
| 522 | + includeUpper, |
| 523 | + MultiTermQuery.DOC_VALUES_REWRITE |
| 524 | + ); |
| 525 | + } |
| 526 | + return new TermRangeQuery( |
| 527 | + name(), |
| 528 | + lowerTerm == null ? null : indexedValueForSearch(lowerTerm), |
| 529 | + upperTerm == null ? null : indexedValueForSearch(upperTerm), |
| 530 | + includeLower, |
| 531 | + includeUpper |
| 532 | + ); |
| 533 | + } |
| 534 | + |
| 535 | + @Override |
| 536 | + public Query fuzzyQuery( |
| 537 | + Object value, |
| 538 | + Fuzziness fuzziness, |
| 539 | + int prefixLength, |
| 540 | + int maxExpansions, |
| 541 | + boolean transpositions, |
| 542 | + @Nullable MultiTermQuery.RewriteMethod method, |
| 543 | + QueryShardContext context |
| 544 | + ) { |
| 545 | + failIfNotIndexedAndNoDocValues(); |
| 546 | + if (context.allowExpensiveQueries() == false) { |
| 547 | + throw new OpenSearchException( |
| 548 | + "[fuzzy] queries cannot be executed when '" + ALLOW_EXPENSIVE_QUERIES.getKey() + "' is set to " + "false." |
| 549 | + ); |
| 550 | + } |
| 551 | + if (isSearchable() && hasDocValues()) { |
| 552 | + Query indexQuery = super.fuzzyQuery(value, fuzziness, prefixLength, maxExpansions, transpositions, context); |
| 553 | + Query dvQuery = super.fuzzyQuery( |
| 554 | + value, |
| 555 | + fuzziness, |
| 556 | + prefixLength, |
| 557 | + maxExpansions, |
| 558 | + transpositions, |
| 559 | + MultiTermQuery.DOC_VALUES_REWRITE, |
| 560 | + context |
| 561 | + ); |
| 562 | + return new IndexOrDocValuesQuery(indexQuery, dvQuery); |
| 563 | + } |
| 564 | + if (hasDocValues()) { |
| 565 | + return new FuzzyQuery( |
| 566 | + new Term(name(), indexedValueForSearch(value)), |
| 567 | + fuzziness.asDistance(BytesRefs.toString(value)), |
| 568 | + prefixLength, |
| 569 | + maxExpansions, |
| 570 | + transpositions, |
| 571 | + MultiTermQuery.DOC_VALUES_REWRITE |
| 572 | + ); |
| 573 | + } |
| 574 | + return super.fuzzyQuery(value, fuzziness, prefixLength, maxExpansions, transpositions, context); |
| 575 | + } |
| 576 | + |
375 | 577 | @Override
|
376 | 578 | public Query wildcardQuery(
|
377 | 579 | String value,
|
378 | 580 | @Nullable MultiTermQuery.RewriteMethod method,
|
379 |
| - boolean caseInsensitve, |
| 581 | + boolean caseInsensitive, |
380 | 582 | QueryShardContext context
|
381 | 583 | ) {
|
382 |
| - // keyword field types are always normalized, so ignore case sensitivity and force normalize the wildcard |
| 584 | + if (context.allowExpensiveQueries() == false) { |
| 585 | + throw new OpenSearchException( |
| 586 | + "[wildcard] queries cannot be executed when '" + ALLOW_EXPENSIVE_QUERIES.getKey() + "' is set to " + "false." |
| 587 | + ); |
| 588 | + } |
| 589 | + failIfNotIndexedAndNoDocValues(); |
| 590 | + // keyword field types are always normalized, so ignore case sensitivity and force normalize the |
| 591 | + // wildcard |
383 | 592 | // query text
|
384 |
| - return super.wildcardQuery(value, method, caseInsensitve, true, context); |
| 593 | + if (isSearchable() && hasDocValues()) { |
| 594 | + Query indexQuery = super.wildcardQuery(value, method, caseInsensitive, true, context); |
| 595 | + Query dvQuery = super.wildcardQuery(value, MultiTermQuery.DOC_VALUES_REWRITE, caseInsensitive, true, context); |
| 596 | + return new IndexOrDocValuesQuery(indexQuery, dvQuery); |
| 597 | + } |
| 598 | + if (hasDocValues()) { |
| 599 | + Term term; |
| 600 | + value = normalizeWildcardPattern(name(), value, getTextSearchInfo().getSearchAnalyzer()); |
| 601 | + term = new Term(name(), value); |
| 602 | + if (caseInsensitive) { |
| 603 | + return AutomatonQueries.caseInsensitiveWildcardQuery(term, method); |
| 604 | + } |
| 605 | + return new WildcardQuery(term, Operations.DEFAULT_DETERMINIZE_WORK_LIMIT, MultiTermQuery.DOC_VALUES_REWRITE); |
| 606 | + } |
| 607 | + return super.wildcardQuery(value, method, caseInsensitive, true, context); |
385 | 608 | }
|
| 609 | + |
386 | 610 | }
|
387 | 611 |
|
388 | 612 | private final boolean indexed;
|
@@ -422,8 +646,10 @@ protected KeywordFieldMapper(
|
422 | 646 | this.indexAnalyzers = builder.indexAnalyzers;
|
423 | 647 | }
|
424 | 648 |
|
425 |
| - /** Values that have more chars than the return value of this method will |
426 |
| - * be skipped at parsing time. */ |
| 649 | + /** |
| 650 | + * Values that have more chars than the return value of this method will |
| 651 | + * be skipped at parsing time. |
| 652 | + */ |
427 | 653 | public int ignoreAbove() {
|
428 | 654 | return ignoreAbove;
|
429 | 655 | }
|
|
0 commit comments