Commit 0b0e31a

Added custom bulk scorer for hybrid query
Signed-off-by: Martin Gaievski <[email protected]>
1 parent d42efb1 commit 0b0e31a

18 files changed: +908, -408 lines

CHANGELOG.md

Lines changed: 2 additions & 1 deletion

@@ -7,9 +7,10 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 
 ### Features
 - Implement analyzer based neural sparse query ([#1088](https://github.com/opensearch-project/neural-search/pull/1088) [#1279](https://github.com/opensearch-project/neural-search/pull/1279))
-- [Semantic Field] Add semantic field mapper. ([#1225](https://github.com/opensearch-project/neural-search/pull/1225)).
+- [Semantic Field] Add semantic field mapper. ([#1225](https://github.com/opensearch-project/neural-search/pull/1225))
 
 ### Enhancements
+- [Performance Improvement] Add custom bulk scorer for hybrid query (2-3x faster) ([#1289](https://github.com/opensearch-project/neural-search/pull/1289))
 
 ### Bug Fixes
 - Add validations to prevent empty input_text_field and input_image_field in TextImageEmbeddingProcessor ([#1257](https://github.com/opensearch-project/neural-search/pull/1257))

src/main/java/org/opensearch/neuralsearch/query/HybridBulkScorer.java (new file)

Lines changed: 176 additions & 0 deletions

@@ -0,0 +1,176 @@
/*
 * Copyright OpenSearch Contributors
 * SPDX-License-Identifier: Apache-2.0
 */
package org.opensearch.neuralsearch.query;

import lombok.Getter;
import org.apache.lucene.search.BulkScorer;
import org.apache.lucene.search.DocIdSetIterator;
import org.apache.lucene.search.LeafCollector;
import org.apache.lucene.search.Scorer;
import org.apache.lucene.util.Bits;
import org.apache.lucene.util.FixedBitSet;

import java.io.IOException;
import java.util.Arrays;
import java.util.List;
import java.util.Objects;

/**
 * Bulk scorer for hybrid query
 */
public class HybridBulkScorer extends BulkScorer {
    private static final int SHIFT = 10;
    private static final int WINDOW_SIZE = 1 << SHIFT;
    private static final int MASK = WINDOW_SIZE - 1;

    private final long cost;
    private final Scorer[] scorers;
    @Getter
    private final HybridSubQueryScorer hybridSubQueryScorer;
    private final boolean needsScores;
    @Getter
    private final FixedBitSet matching;
    @Getter
    private final float[][] windowScores;
    private final HybridQueryDocIdStream hybridQueryDocIdStream;
    private final int maxDoc;

    public HybridBulkScorer(List<Scorer> scorers, boolean needsScores, int maxDoc) {
        long cost = 0;
        this.scorers = new Scorer[scorers.size()];
        for (int subQueryIndex = 0; subQueryIndex < scorers.size(); subQueryIndex++) {
            Scorer scorer = scorers.get(subQueryIndex);
            if (Objects.isNull(scorer)) {
                continue;
            }
            cost += scorer.iterator().cost();
            this.scorers[subQueryIndex] = scorer;
        }
        this.cost = cost;
        this.hybridSubQueryScorer = new HybridSubQueryScorer(scorers.size());
        this.needsScores = needsScores;
        this.matching = new FixedBitSet(WINDOW_SIZE);
        this.windowScores = new float[this.scorers.length][WINDOW_SIZE];
        this.maxDoc = maxDoc;
        this.hybridQueryDocIdStream = new HybridQueryDocIdStream(this);
    }

    @Override
    public int score(LeafCollector collector, Bits acceptDocs, int min, int max) throws IOException {
        collector.setScorer(hybridSubQueryScorer);
        // making sure we are not going over the global limit defined by maxDoc
        max = Math.min(max, maxDoc);
        int[] docsIds = advance(min, scorers);
        while (allDocIdsUsed(docsIds, max) == false) {
            scoreWindow(collector, acceptDocs, min, max, docsIds);
        }
        return getNextDocIdCandidate(docsIds);
    }

    private void scoreWindow(LeafCollector collector, Bits acceptDocs, int min, int max, int[] docIds) throws IOException {
        // pick the lowest out of all not yet used doc ids
        int topDoc = -1;
        for (int docId : docIds) {
            if (docId < max) {
                topDoc = docId;
                break;
            }
        }

        final int windowBase = topDoc & ~MASK; // take the next match (at random) and find the window where it belongs
        final int windowMin = Math.max(min, windowBase);
        final int windowMax = Math.min(max, windowBase + WINDOW_SIZE);

        scoreWindowIntoBitSetWithSubqueryScorers(collector, acceptDocs, max, docIds, windowMin, windowMax, windowBase);
    }

    private void scoreWindowIntoBitSetWithSubqueryScorers(
        LeafCollector collector,
        Bits acceptDocs,
        int max,
        int[] docIds,
        int windowMin,
        int windowMax,
        int windowBase
    ) throws IOException {
        for (int subQueryIndex = 0; subQueryIndex < scorers.length; subQueryIndex++) {
            if (Objects.isNull(scorers[subQueryIndex]) || docIds[subQueryIndex] >= max) {
                continue;
            }
            DocIdSetIterator it = scorers[subQueryIndex].iterator();
            int doc = docIds[subQueryIndex];
            if (doc < windowMin) {
                doc = it.advance(windowMin);
            }
            while (doc < windowMax) {
                if (Objects.isNull(acceptDocs) || acceptDocs.get(doc)) {
                    int d = doc & MASK;
                    if (needsScores) {
                        float score = scorers[subQueryIndex].score();
                        // collect score only in case it's gt competitive score
                        if (score > hybridSubQueryScorer.getMinScores()[subQueryIndex]) {
                            matching.set(d);
                            windowScores[subQueryIndex][d] = score;
                        }
                    } else {
                        matching.set(d);
                    }
                }
                doc = it.nextDoc();
            }
            docIds[subQueryIndex] = doc;
        }

        hybridQueryDocIdStream.setBase(windowBase);
        collector.collect(hybridQueryDocIdStream);

        matching.clear();

        for (float[] windowScore : windowScores) {
            Arrays.fill(windowScore, 0.0f);
        }
    }

    private int[] advance(int min, Scorer[] scorers) throws IOException {
        int[] docIds = new int[scorers.length];
        for (int subQueryIndex = 0; subQueryIndex < scorers.length; subQueryIndex++) {
            if (Objects.isNull(scorers[subQueryIndex])) {
                docIds[subQueryIndex] = DocIdSetIterator.NO_MORE_DOCS;
                continue;
            }
            DocIdSetIterator it = scorers[subQueryIndex].iterator();
            int doc = it.docID();
            if (doc < min) {
                doc = it.advance(min);
            }
            docIds[subQueryIndex] = doc;
        }
        return docIds;
    }

    private boolean allDocIdsUsed(int[] docsIds, int max) {
        for (int docId : docsIds) {
            if (docId < max) {
                return false;
            }
        }
        return true;
    }

    private int getNextDocIdCandidate(final int[] docsIds) {
        int nextDoc = -1;
        for (int doc : docsIds) {
            if (doc != DocIdSetIterator.NO_MORE_DOCS) {
                nextDoc = Math.max(nextDoc, doc);
            }
        }
        return nextDoc == -1 ? DocIdSetIterator.NO_MORE_DOCS : nextDoc;
    }

    @Override
    public long cost() {
        return cost;
    }
}
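
Note on the window arithmetic above: with SHIFT = 10 the scorer walks a segment in fixed windows of 1024 doc ids, and the two masks split a global doc id into a window base plus an offset inside that window. The snippet below is a standalone illustration of that masking (not part of the commit); the constants simply mirror the ones declared in HybridBulkScorer.

public class WindowMathSketch {
    private static final int SHIFT = 10;
    private static final int WINDOW_SIZE = 1 << SHIFT; // 1024 docs per window
    private static final int MASK = WINDOW_SIZE - 1;   // low 10 bits select the offset inside a window

    public static void main(String[] args) {
        int doc = 5000;                  // an arbitrary global doc id
        int windowBase = doc & ~MASK;    // start of its 1024-doc window -> 4096
        int indexInWindow = doc & MASK;  // offset inside the window     -> 904
        // matches are recorded at indexInWindow; the global id is later restored as base | offset
        System.out.println(windowBase + " | " + indexInWindow + " = " + (windowBase | indexInWindow)); // 4096 | 904 = 5000
    }
}

This windowed approach is similar in spirit to Lucene's own BooleanScorer, which also scores disjunctions one fixed-size block of documents at a time.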

src/main/java/org/opensearch/neuralsearch/query/HybridQueryDocIdStream.java (new file)

Lines changed: 62 additions & 0 deletions

@@ -0,0 +1,62 @@
/*
 * Copyright OpenSearch Contributors
 * SPDX-License-Identifier: Apache-2.0
 */
package org.opensearch.neuralsearch.query;

import lombok.RequiredArgsConstructor;
import lombok.Setter;
import org.apache.lucene.search.CheckedIntConsumer;
import org.apache.lucene.search.DocIdStream;
import org.apache.lucene.util.FixedBitSet;

import java.io.IOException;
import java.util.Objects;

/**
 * This class is used to create a DocIdStream for HybridQuery
 */
@RequiredArgsConstructor
public class HybridQueryDocIdStream extends DocIdStream {
    private final HybridBulkScorer hybridBulkScorer;
    @Setter
    private int base;

    /**
     * Iterate over all doc ids and collect each doc id with leaf collector
     * @param consumer consumer that is called for each accepted doc id
     * @throws IOException in case of IO exception
     */
    @Override
    public void forEach(CheckedIntConsumer<IOException> consumer) throws IOException {
        // bitset that represents matching documents, bit is set (1) if doc id is a match
        FixedBitSet matchingBitSet = hybridBulkScorer.getMatching();
        long[] bitArray = matchingBitSet.getBits();
        // iterate through each block of 64 documents (since each long contains 64 bits)
        for (int idx = 0; idx < bitArray.length; idx++) {
            long bits = bitArray[idx];
            while (bits != 0L) {
                // find position of the rightmost set bit (1)
                int numberOfTrailingZeros = Long.numberOfTrailingZeros(bits);
                // calculate actual document ID within the window
                // idx << 6 is equivalent to idx * 64 (block offset)
                // numberOfTrailingZeros gives position within the block
                final int docIndexInWindow = (idx << 6) | numberOfTrailingZeros;
                float[][] windowScores = hybridBulkScorer.getWindowScores();
                for (int subQueryIndex = 0; subQueryIndex < windowScores.length; subQueryIndex++) {
                    if (Objects.isNull(windowScores[subQueryIndex])) {
                        continue;
                    }
                    float scoreOfDocIdForSubQuery = windowScores[subQueryIndex][docIndexInWindow];
                    hybridBulkScorer.getHybridSubQueryScorer().getSubQueryScores()[subQueryIndex] = scoreOfDocIdForSubQuery;
                }
                // process the document with its base offset
                consumer.accept(base | docIndexInWindow);
                // reset scores after processing of one doc, this is required because scorer object is re-used
                hybridBulkScorer.getHybridSubQueryScorer().resetScores();
                // reset bit for this doc id to indicate that it has been consumed
                bits ^= 1L << numberOfTrailingZeros;
            }
        }
    }
}
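
The forEach loop above relies on a standard trick for walking the set bits of a 64-bit word: Long.numberOfTrailingZeros finds the lowest set bit and an XOR clears it, so each matching offset in the window is visited exactly once. A standalone sketch of just that loop (not part of the commit):

public class SetBitIterationSketch {
    public static void main(String[] args) {
        long bits = 0b1010010L; // offsets 1, 4 and 6 are "matches" in this 64-doc block
        while (bits != 0L) {
            int offset = Long.numberOfTrailingZeros(bits); // position of the lowest set bit
            System.out.println("matching offset in block: " + offset); // prints 1, then 4, then 6
            bits ^= 1L << offset; // clear the bit that was just consumed
        }
    }
}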

src/main/java/org/opensearch/neuralsearch/query/HybridQueryScorer.java

Lines changed: 5 additions & 6 deletions

@@ -14,7 +14,6 @@
 import org.apache.lucene.search.ScoreMode;
 import org.apache.lucene.search.Scorer;
 import org.apache.lucene.search.TwoPhaseIterator;
-import org.apache.lucene.search.Weight;
 import org.apache.lucene.util.PriorityQueue;
 import org.opensearch.neuralsearch.search.HybridDisiWrapper;

@@ -44,11 +43,11 @@ public class HybridQueryScorer extends Scorer {
     private final TwoPhase twoPhase;
     private final int numSubqueries;
 
-    public HybridQueryScorer(final Weight weight, final List<Scorer> subScorers) throws IOException {
-        this(weight, subScorers, ScoreMode.TOP_SCORES);
+    public HybridQueryScorer(final List<Scorer> subScorers) throws IOException {
+        this(subScorers, ScoreMode.TOP_SCORES);
     }
 
-    HybridQueryScorer(final Weight weight, final List<Scorer> subScorers, final ScoreMode scoreMode) throws IOException {
+    HybridQueryScorer(final List<Scorer> subScorers, final ScoreMode scoreMode) throws IOException {
         super();
         this.subScorers = Collections.unmodifiableList(subScorers);
         this.numSubqueries = subScorers.size();

@@ -75,7 +74,7 @@ public HybridQueryScorer(final Weight weight, final List<Scorer> subScorers) thr
                 sumMatchCost += w.matchCost * costWeight;
             }
         }
-        if (!hasApproximation) { // no sub scorer supports approximations
+        if (hasApproximation == false) { // no sub scorer supports approximations
            twoPhase = null;
        } else {
            final float matchCost = sumMatchCost / sumApproxCost;

@@ -284,7 +283,7 @@ public boolean matches() throws IOException {
             wrapper.next = verifiedMatches;
             verifiedMatches = wrapper;
 
-            if (!needsScores) {
+            if (needsScores == false) {
                 // we can stop here
                 return true;
             }

src/main/java/org/opensearch/neuralsearch/query/HybridQueryWeight.java

Lines changed: 18 additions & 5 deletions

@@ -15,6 +15,7 @@
 import lombok.Getter;
 import lombok.RequiredArgsConstructor;
 import org.apache.lucene.index.LeafReaderContext;
+import org.apache.lucene.search.BulkScorer;
 import org.apache.lucene.search.Explanation;
 import org.apache.lucene.search.IndexSearcher;
 import org.apache.lucene.search.Matches;

@@ -37,7 +38,6 @@ public final class HybridQueryWeight extends Weight {
     // The Weights for our subqueries, in 1-1 correspondence
     @Getter(AccessLevel.PACKAGE)
     private final List<Weight> weights;
-
     private final ScoreMode scoreMode;
 
     /**

@@ -95,7 +95,7 @@ public ScorerSupplier scorerSupplier(LeafReaderContext context) throws IOExcepti
         if (scorerSuppliers.isEmpty()) {
             return null;
         }
-        return new HybridScorerSupplier(scorerSuppliers, this, scoreMode);
+        return new HybridScorerSupplier(scorerSuppliers, this, scoreMode, context);
     }
 
     private Void addScoreSupplier(Weight weight, HybridQueryExecutorCollector<LeafReaderContext, ScorerSupplier> collector) {

@@ -145,7 +145,7 @@ public Explanation explain(LeafReaderContext context, int doc) throws IOExceptio
                 max = Math.max(max, score);
                 subsOnMatch.add(e);
             } else {
-                if (!match) {
+                if (match == false) {
                     subsOnNoMatch.add(e);
                 }
                 subsOnMatch.add(e);

@@ -161,10 +161,23 @@
 
     @RequiredArgsConstructor
     static class HybridScorerSupplier extends ScorerSupplier {
+
+        @Override
+        public BulkScorer bulkScorer() throws IOException {
+            List<Scorer> scorers = new ArrayList<>();
+            for (Weight weight : weight.getWeights()) {
+                Scorer scorer = weight.scorer(context);
+                scorers.add(scorer);
+            }
+            return new HybridBulkScorer(scorers, scoreMode.needsScores(), context.reader().maxDoc());
+        }
+
         private long cost = -1;
+        @Getter
         private final List<ScorerSupplier> scorerSuppliers;
-        private final Weight weight;
+        private final HybridQueryWeight weight;
         private final ScoreMode scoreMode;
+        private final LeafReaderContext context;
 
         @Override
         public Scorer get(long leadCost) throws IOException {

@@ -176,7 +189,7 @@ public Scorer get(long leadCost) throws IOException {
                     tScorers.add(null);
                 }
             }
-            return new HybridQueryScorer(weight, tScorers, scoreMode);
+            return new HybridQueryScorer(tScorers, scoreMode);
         }
 
         @Override
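
With bulkScorer() now overridden on the ScorerSupplier, Lucene can score an entire leaf for a hybrid query through HybridBulkScorer instead of advancing a doc-by-doc disjunction. The fragment below is a rough sketch of how a caller drives it, not the actual IndexSearcher code; leafCollector and liveDocs are assumed to come from the surrounding search context.

static void scoreLeaf(ScorerSupplier scorerSupplier, LeafCollector leafCollector, Bits liveDocs) throws IOException {
    // for a hybrid query this returns the HybridBulkScorer built in the diff above
    BulkScorer bulkScorer = scorerSupplier.bulkScorer();
    // score the whole doc-id range of the leaf; HybridBulkScorer splits it into 1024-doc windows,
    // records matches and per-sub-query scores, and pushes them to the collector
    // through HybridQueryDocIdStream
    bulkScorer.score(leafCollector, liveDocs, 0, DocIdSetIterator.NO_MORE_DOCS);
}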