will-hwang
diff --git a/‎src/main/java/org/opensearch/neuralsearch/processor/InferenceProcessor.java
Lines changed: 194 additions & 27 deletions b/‎src/main/java/org/opensearch/neuralsearch/processor/InferenceProcessor.java
Lines changed: 194 additions & 27 deletions
diff --git a/‎src/main/java/org/opensearch/neuralsearch/processor/TextEmbeddingProcessor.java
Lines changed: 47 additions & 1 deletion b/‎src/main/java/org/opensearch/neuralsearch/processor/TextEmbeddingProcessor.java
Lines changed: 47 additions & 1 deletion
@@ -7,7 +7,6 @@
 import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.Collection;
-import java.util.Collections;
 import java.util.Comparator;
 import java.util.HashMap;
 import java.util.Iterator;
@@ -26,6 +25,10 @@
 import org.apache.commons.lang3.StringUtils;
 import org.apache.commons.lang3.tuple.ImmutablePair;
 import org.apache.commons.lang3.tuple.Pair;
+import org.opensearch.action.get.MultiGetItemResponse;
+import org.opensearch.action.get.MultiGetRequest;
+import org.opensearch.action.get.MultiGetResponse;
+import org.opensearch.common.CheckedConsumer;
 import org.opensearch.common.collect.Tuple;
 import org.opensearch.core.action.ActionListener;
 import org.opensearch.core.common.util.CollectionUtils;
@@ -42,6 +45,7 @@
 import com.google.common.collect.ImmutableMap;
 
 import lombok.extern.log4j.Log4j2;
+import org.opensearch.neuralsearch.processor.optimization.InferenceFilter;
 import org.opensearch.neuralsearch.util.ProcessorDocumentUtils;
 
 /**
@@ -54,6 +58,8 @@ public abstract class InferenceProcessor extends AbstractBatchingProcessor {
 
     public static final String MODEL_ID_FIELD = "model_id";
     public static final String FIELD_MAP_FIELD = "field_map";
+    public static final String INDEX_FIELD = "_index";
+    public static final String ID_FIELD = "_id";
     private static final BiFunction<Object, Object, Object> REMAPPING_FUNCTION = (v1, v2) -> {
         if (v1 instanceof Collection && v2 instanceof Collection) {
             ((Collection) v1).addAll((Collection) v2);
@@ -169,23 +175,67 @@ void preprocessIngestDocument(IngestDocument ingestDocument) {
      */
     abstract void doBatchExecute(List<String> inferenceList, Consumer<List<?>> handler, Consumer<Exception> onException);
 
+    /**
+     * Collects the inference texts for a sub-batch and passes them to doSubBatchExecute; exceptions go to updateWithExceptions.
+     * @param ingestDocumentWrappers a list of IngestDocuments in a batch.
+     * @param handler a callback that receives ingestDocumentWrappers, unchanged when the batch is empty or has nothing to infer.
+     */
     @Override
     public void subBatchExecute(List<IngestDocumentWrapper> ingestDocumentWrappers, Consumer<List<IngestDocumentWrapper>> handler) {
-        if (CollectionUtils.isEmpty(ingestDocumentWrappers)) {
-            handler.accept(Collections.emptyList());
-            return;
+        try {
+            if (CollectionUtils.isEmpty(ingestDocumentWrappers)) {
+                handler.accept(ingestDocumentWrappers);
+                return;
+            }
+
+            List<DataForInference> dataForInferences = getDataForInference(ingestDocumentWrappers);
+            List<String> inferenceList = constructInferenceTexts(dataForInferences);
+            if (inferenceList.isEmpty()) {
+                handler.accept(ingestDocumentWrappers);
+                return;
+            }
+            doSubBatchExecute(ingestDocumentWrappers, inferenceList, dataForInferences, handler);
+        } catch (Exception e) {
+            updateWithExceptions(ingestDocumentWrappers, handler, e);
         }
+    }
 
-        List<DataForInference> dataForInferences = getDataForInference(ingestDocumentWrappers);
-        List<String> inferenceList = constructInferenceTexts(dataForInferences);
-        if (inferenceList.isEmpty()) {
-            handler.accept(ingestDocumentWrappers);
-            return;
+    /**
+     * This is a helper function for subBatchExecute, which invokes doBatchExecute for the given inference list and reports to handler.
+     * @param ingestDocumentWrappers a list of IngestDocuments in a batch.
+     * @param inferenceList a list of String for inference.
+     * @param dataForInferences a list of data for inference, which includes ingestDocumentWrapper, processMap, inferenceList.
+     */
+    protected void doSubBatchExecute(
+        List<IngestDocumentWrapper> ingestDocumentWrappers,
+        List<String> inferenceList,
+        List<DataForInference> dataForInferences,
+        Consumer<List<IngestDocumentWrapper>> handler
+    ) {
+        try {
+            // sortByLengthAndReturnOriginalOrder also yields the index map that batchExecuteHandler uses to restore the result order
+            Tuple<List<String>, Map<Integer, Integer>> sorted = sortByLengthAndReturnOriginalOrder(inferenceList);
+            List<String> sortedInferenceList = sorted.v1();
+            Map<Integer, Integer> originalOrder = sorted.v2();
+            doBatchExecute(
+                sortedInferenceList,
+                results -> batchExecuteHandler(results, ingestDocumentWrappers, dataForInferences, originalOrder, handler),
+                // inference failed: set the exception on every document that does not carry one yet
+                exception -> updateWithExceptions(ingestDocumentWrappers, handler, exception)
+            );
+        } catch (Exception failure) {
+            updateWithExceptions(ingestDocumentWrappers, handler, failure);
         }
-        Tuple<List<String>, Map<Integer, Integer>> sortedResult = sortByLengthAndReturnOriginalOrder(inferenceList);
-        inferenceList = sortedResult.v1();
-        Map<Integer, Integer> originalOrder = sortedResult.v2();
-        doBatchExecute(inferenceList, results -> {
+    }
+
+    private void batchExecuteHandler(
+        List<?> results,
+        List<IngestDocumentWrapper> ingestDocumentWrappers,
+        List<DataForInference> dataForInferences,
+        Map<Integer, Integer> originalOrder,
+        Consumer<List<IngestDocumentWrapper>> handler
+    ) {
+        try {
             int startIndex = 0;
             results = restoreToOriginalOrder(results, originalOrder);
             for (DataForInference dataForInference : dataForInferences) {
@@ -202,16 +252,9 @@ public void subBatchExecute(List<IngestDocumentWrapper> ingestDocumentWrappers,
                 );
             }
             handler.accept(ingestDocumentWrappers);
-        }, exception -> {
-            for (IngestDocumentWrapper ingestDocumentWrapper : ingestDocumentWrappers) {
-                // The IngestDocumentWrapper might already run into exception and not sent for inference. So here we only
-                // set exception to IngestDocumentWrapper which doesn't have exception before.
-                if (ingestDocumentWrapper.getException() == null) {
-                    ingestDocumentWrapper.update(ingestDocumentWrapper.getIngestDocument(), exception);
-                }
-            }
-            handler.accept(ingestDocumentWrappers);
-        });
+        } catch (Exception e) {
+            updateWithExceptions(ingestDocumentWrappers, handler, e);
+        }
     }
 
     private Tuple<List<String>, Map<Integer, Integer>> sortByLengthAndReturnOriginalOrder(List<String> inferenceList) {
@@ -238,7 +281,7 @@ private List<?> restoreToOriginalOrder(List<?> results, Map<Integer, Integer> or
         return sortedResults;
     }
 
-    private List<String> constructInferenceTexts(List<DataForInference> dataForInferences) {
+    protected List<String> constructInferenceTexts(List<DataForInference> dataForInferences) {
         List<String> inferenceTexts = new ArrayList<>();
         for (DataForInference dataForInference : dataForInferences) {
             if (dataForInference.getIngestDocumentWrapper().getException() != null
@@ -250,7 +293,7 @@ private List<String> constructInferenceTexts(List<DataForInference> dataForInfer
         return inferenceTexts;
     }
 
-    private List<DataForInference> getDataForInference(List<IngestDocumentWrapper> ingestDocumentWrappers) {
+    protected List<DataForInference> getDataForInference(List<IngestDocumentWrapper> ingestDocumentWrappers) {
         List<DataForInference> dataForInferences = new ArrayList<>();
         for (IngestDocumentWrapper ingestDocumentWrapper : ingestDocumentWrappers) {
             Map<String, Object> processMap = null;
@@ -272,7 +315,7 @@ private List<DataForInference> getDataForInference(List<IngestDocumentWrapper> i
 
     @Getter
     @AllArgsConstructor
-    private static class DataForInference {
+    protected static class DataForInference {
         private final IngestDocumentWrapper ingestDocumentWrapper;
         private final Map<String, Object> processMap;
         private final List<String> inferenceList;
@@ -415,6 +458,36 @@ protected void setVectorFieldsToDocument(IngestDocument ingestDocument, Map<Stri
         nlpResult.forEach(ingestDocument::setFieldValue);
     }
 
+    /**
+     * This method builds the MultiGetRequest used to fetch the stored versions of the given ingest documents for comparison
+     * @param dataForInferences, list of data for inferences
+     * */
+    protected MultiGetRequest buildMultiGetRequest(List<DataForInference> dataForInferences) {
+        MultiGetRequest request = new MultiGetRequest();
+        for (DataForInference data : dataForInferences) {
+            Map<String, Object> metadata = data.getIngestDocumentWrapper().getIngestDocument().getSourceAndMetadata();
+            if (metadata.get(INDEX_FIELD) == null || metadata.get(ID_FIELD) == null) {
+                continue; // a document without both its index and its id is left out of the request
+            }
+            request.add(metadata.get(INDEX_FIELD).toString(), metadata.get(ID_FIELD).toString());
+        }
+        return request;
+    }
+
+    /**
+     * This method creates a map from document ID to existing document; multi-get items that failed or carry no source are left out
+     * @param multiGetItemResponses, array of responses from Multi Get Request
+     * */
+    protected Map<String, Map<String, Object>> createDocumentMap(MultiGetItemResponse[] multiGetItemResponses) {
+        Map<String, Map<String, Object>> existingDocuments = new HashMap<>();
+        for (MultiGetItemResponse item : multiGetItemResponses) {
+            if (item.isFailed() == false && item.getResponse().getSourceAsMap() != null) {
+                existingDocuments.put(item.getId(), item.getResponse().getSourceAsMap());
+            }
+        }
+        return existingDocuments;
+    }
+
     @SuppressWarnings({ "unchecked" })
     @VisibleForTesting
     Map<String, Object> buildNLPResult(Map<String, Object> processorMap, List<?> results, Map<String, Object> sourceAndMetadataMap) {
@@ -504,6 +577,27 @@ private void processMapEntryValue(
         }
     }
 
+    // This method sets the given exception on each ingestDocument that has none yet and passes ingestDocumentWrappers to handler.
+    // Ingestion fails when exception occurs while updating: that exception is logged and handler receives null
+    protected void updateWithExceptions(
+        List<IngestDocumentWrapper> ingestDocumentWrappers,
+        Consumer<List<IngestDocumentWrapper>> handler,
+        Exception e
+    ) {
+        try {
+            for (IngestDocumentWrapper ingestDocumentWrapper : ingestDocumentWrappers) {
+                // keep the exception a wrapper already carries; only wrappers without one get the new exception
+                if (ingestDocumentWrapper.getException() == null) {
+                    ingestDocumentWrapper.update(ingestDocumentWrapper.getIngestDocument(), e);
+                }
+            }
+            handler.accept(ingestDocumentWrappers);
+        } catch (Exception ex) {
+            log.error("Failed to update ingest documents with exception", ex);
+            handler.accept(null);
+        }
+    }
+
     private void processMapEntryValue(
         List<?> results,
         IndexWrapper indexWrapper,
@@ -582,11 +676,65 @@ private List<Map<String, Object>> buildNLPResultForListType(List<String> sourceV
         List<Map<String, Object>> keyToResult = new ArrayList<>();
         sourceValue.stream()
             .filter(Objects::nonNull) // explicit null check is required since sourceValue can contain null values in cases where
-                                      // sourceValue has been filtered
+            // sourceValue has been filtered
             .forEachOrdered(x -> keyToResult.add(ImmutableMap.of(listTypeNestedMapKey, results.get(indexWrapper.index++))));
         return keyToResult;
     }
 
+    // This method handles a successful multi-get response: it filters dataForInferences against the fetched documents and runs
+    // inference on whatever is left.
+    protected void multiGetResponseHandler(
+        MultiGetResponse response,
+        List<IngestDocumentWrapper> ingestDocumentWrappers,
+        List<String> inferenceList,
+        List<DataForInference> dataForInferences,
+        Consumer<List<IngestDocumentWrapper>> handler,
+        InferenceFilter inferenceFilter
+    ) {
+        MultiGetItemResponse[] items = response.getResponses();
+        // nothing was fetched, so there is nothing to compare against: run inference on the unfiltered data
+        if (items == null || items.length == 0) {
+            doSubBatchExecute(ingestDocumentWrappers, inferenceList, dataForInferences, handler);
+            return;
+        }
+        List<DataForInference> remainingData = filterDataForInference(inferenceFilter, dataForInferences, createDocumentMap(items));
+        List<String> remainingTexts = constructInferenceTexts(remainingData);
+        if (remainingTexts.isEmpty() == false) {
+            doSubBatchExecute(ingestDocumentWrappers, remainingTexts, remainingData, handler);
+            return;
+        }
+        // every inference text was filtered out, so hand the documents back without running inference
+        handler.accept(ingestDocumentWrappers);
+    }
+
+    // This is a helper method to filter the given list of dataForInferences by comparing its documents with existingDocuments with
+    // given inferenceFilter
+    protected List<DataForInference> filterDataForInference(
+        InferenceFilter inferenceFilter,
+        List<DataForInference> dataForInferences,
+        Map<String, Map<String, Object>> existingDocuments
+    ) {
+        List<DataForInference> filteredDataForInference = new ArrayList<>();
+        for (DataForInference dataForInference : dataForInferences) {
+            IngestDocumentWrapper ingestDocumentWrapper = dataForInference.getIngestDocumentWrapper();
+            Map<String, Object> processMap = dataForInference.getProcessMap();
+            Map<String, Object> document = ingestDocumentWrapper.getIngestDocument().getSourceAndMetadata();
+            Object id = document.get(ID_FIELD);
+            // a single lookup covers both a missing key and a key mapped to null, so a null document never reaches the filter
+            Map<String, Object> existingDocument = Objects.isNull(id) ? null : existingDocuments.get(id.toString());
+            // insert non-filtered dataForInference if existing document does not exist
+            if (Objects.isNull(existingDocument)) {
+                filteredDataForInference.add(dataForInference);
+                continue;
+            }
+            // filter dataForInference when existing document exists
+            Map<String, Object> filteredProcessMap = inferenceFilter.filter(existingDocument, document, processMap);
+            List<String> filteredInferenceList = createInferenceList(filteredProcessMap);
+            filteredDataForInference.add(new DataForInference(ingestDocumentWrapper, filteredProcessMap, filteredInferenceList));
+        }
+        return filteredDataForInference;
+    }
+
     /**
      * This method invokes inference call through mlCommonsClientAccessor and populates retrieved embeddings to ingestDocument
      *
@@ -611,6 +759,25 @@ protected void makeInferenceCall(
         );
     }
 
+    protected <Response> ActionListener<Response> wrap(
+        final CheckedConsumer<Response, ? extends Exception> onResponse,
+        final Consumer<Exception> onFailure
+    ) {
+        return new ActionListener<>() { // adapts the response callback and the failure callback into one listener
+            public void onResponse(Response response) {
+                try {
+                    onResponse.accept(response);
+                } catch (Exception e) {
+                    this.onFailure(e); // an exception thrown by the response callback is reported through the failure callback
+                }
+            }
+
+            public void onFailure(Exception e) {
+                onFailure.accept(e);
+            }
+        };
+    }
+
     @Override
     public String getType() {
         return type;
 
@@ -13,10 +13,13 @@
 
 import org.opensearch.action.get.GetAction;
 import org.opensearch.action.get.GetRequest;
+import org.opensearch.action.get.MultiGetAction;
 import org.opensearch.cluster.service.ClusterService;
 import org.opensearch.core.action.ActionListener;
+import org.opensearch.core.common.util.CollectionUtils;
 import org.opensearch.env.Environment;
 import org.opensearch.ingest.IngestDocument;
+import org.opensearch.ingest.IngestDocumentWrapper;
 import org.opensearch.neuralsearch.ml.MLCommonsClientAccessor;
 
 import lombok.extern.log4j.Log4j2;
@@ -74,7 +77,7 @@ public void doExecute(
         // if skipExisting flag is turned on, eligible inference texts will be compared and filtered after embeddings are copied
         String index = ingestDocument.getSourceAndMetadata().get(INDEX_FIELD).toString();
         String id = ingestDocument.getSourceAndMetadata().get(ID_FIELD).toString();
-        openSearchClient.execute(GetAction.INSTANCE, new GetRequest(index, id), ActionListener.wrap(response -> {
+        openSearchClient.execute(GetAction.INSTANCE, new GetRequest(index, id), wrap(response -> {
             final Map<String, Object> existingDocument = response.getSourceAsMap();
             if (existingDocument == null || existingDocument.isEmpty()) {
                 makeInferenceCall(ingestDocument, processMap, inferenceList, handler);
@@ -106,4 +109,47 @@ public void doBatchExecute(List<String> inferenceList, Consumer<List<?>> handler
             ActionListener.wrap(handler::accept, onException)
         );
     }
+
+    @Override
+    public void subBatchExecute(List<IngestDocumentWrapper> ingestDocumentWrappers, Consumer<List<IngestDocumentWrapper>> handler) {
+        try {
+            if (CollectionUtils.isEmpty(ingestDocumentWrappers)) {
+                handler.accept(ingestDocumentWrappers);
+                return;
+            }
+            List<DataForInference> dataForInferences = getDataForInference(ingestDocumentWrappers);
+            List<String> inferenceList = constructInferenceTexts(dataForInferences);
+            if (inferenceList.isEmpty()) {
+                handler.accept(ingestDocumentWrappers);
+                return;
+            }
+            // Call doSubBatchExecute without filtering when skipExisting is off, or when no document carries both _index and _id:
+            // an empty MultiGetRequest fails validation ("no documents to get"), which would mark the whole batch as failed
+            var multiGetRequest = skipExisting == false ? null : buildMultiGetRequest(dataForInferences);
+            if (multiGetRequest == null || multiGetRequest.getItems().isEmpty()) {
+                doSubBatchExecute(ingestDocumentWrappers, inferenceList, dataForInferences, handler);
+                return;
+            }
+            // skipExisting flag is turned on, eligible inference texts in dataForInferences will be compared and filtered after embeddings
+            // are copied
+            openSearchClient.execute(
+                MultiGetAction.INSTANCE,
+                multiGetRequest,
+                wrap(
+                    response -> multiGetResponseHandler(
+                        response,
+                        ingestDocumentWrappers,
+                        inferenceList,
+                        dataForInferences,
+                        handler,
+                        textEmbeddingInferenceFilter
+                    ),
+                    // When exception is thrown in for MultiGetAction, set exception to all ingestDocumentWrappers
+                    e -> updateWithExceptions(ingestDocumentWrappers, handler, e)
+                )
+            );
+        } catch (Exception e) {
+            updateWithExceptions(ingestDocumentWrappers, handler, e);
+        }
+    }
 }