
Commit ffab1bf

sonianuj287 authored and ylwu-amzn committed
fixed comments suggested changes
Signed-off-by: Anuj Soni <[email protected]>
1 parent 1f48d34 commit ffab1bf

File tree

3 files changed: +144 -47 lines changed


plugin/src/test/java/org/opensearch/ml/rest/RestBedRockInferenceIT.java

Lines changed: 107 additions & 8 deletions
@@ -5,19 +5,40 @@
 
 package org.opensearch.ml.rest;
 
+import static org.mockito.ArgumentMatchers.any;
+import static org.mockito.Mockito.doAnswer;
+import static org.mockito.Mockito.mock;
+
 import java.io.IOException;
+import java.lang.reflect.Field;
 import java.nio.file.Files;
 import java.nio.file.Path;
 import java.util.ArrayList;
+import java.util.Collections;
+import java.util.HashMap;
 import java.util.List;
 import java.util.Locale;
 import java.util.Map;
+import java.util.concurrent.CountDownLatch;
+import java.util.concurrent.TimeUnit;
+import java.util.concurrent.atomic.AtomicReference;
 
 import org.junit.Before;
+import org.opensearch.core.action.ActionListener;
 import org.opensearch.ml.common.FunctionName;
 import org.opensearch.ml.common.dataset.TextDocsInputDataSet;
 import org.opensearch.ml.common.input.MLInput;
+import org.opensearch.ml.common.output.MLOutput;
+import org.opensearch.ml.common.output.model.MLResultDataType;
+import org.opensearch.ml.common.output.model.ModelTensor;
+import org.opensearch.ml.common.output.model.ModelTensorOutput;
+import org.opensearch.ml.common.output.model.ModelTensors;
 import org.opensearch.ml.common.utils.StringUtils;
+import org.opensearch.searchpipelines.questionanswering.generative.client.MachineLearningInternalClient;
+import org.opensearch.searchpipelines.questionanswering.generative.llm.ChatCompletionInput;
+import org.opensearch.searchpipelines.questionanswering.generative.llm.ChatCompletionOutput;
+import org.opensearch.searchpipelines.questionanswering.generative.llm.DefaultLlmImpl;
+import org.opensearch.searchpipelines.questionanswering.generative.llm.Llm;
 
 import lombok.SneakyThrows;
 import lombok.extern.log4j.Log4j2;
@@ -82,17 +103,95 @@ public void test_bedrock_embedding_model() throws Exception {
         }
     }
 
-    public void testChatCompletionBedrockErrorResponseFormats() throws Exception {
-        // Simulate Bedrock inference endpoint behavior
-        // You can mock or create sample response maps for two formats
+    public void testChatCompletionBedrockContentFormat() throws Exception {
+        Map<String, Object> response = Map.of("content", List.of(Map.of("text", "Claude V3 response text")));
+
+        Map<String, Object> result = invokeBedrockInference(response);
+
+        assertTrue(result.containsKey("answers"));
+        assertEquals("Claude V3 response text", ((List<?>) result.get("answers")).get(0));
+    }
+
+    private static void injectMlClient(DefaultLlmImpl connector, Object mlClient) {
+        try {
+            Field field = null;
+            // Try common field names. Adjust if the actual field is named differently.
+            try {
+                field = DefaultLlmImpl.class.getDeclaredField("mlClient");
+            } catch (NoSuchFieldException e) {
+                // fallback if different field name
+                field = DefaultLlmImpl.class.getDeclaredField("client");
+            }
+            field.setAccessible(true);
+            field.set(connector, mlClient);
+        } catch (ReflectiveOperationException e) {
+            throw new RuntimeException("Failed to inject mlClient into DefaultLlmImpl", e);
+        }
+    }
 
-        Map<String, Object> errorFormat1 = Map.of("error", Map.of("message", "Unsupported Claude response format"));
+    private Map<String, Object> invokeBedrockInference(Map<String, Object> mockResponse) throws Exception {
+        // Create DefaultLlmImpl and mock ML client
+        DefaultLlmImpl connector = new DefaultLlmImpl("model_id", null); // Use getClient() from MLCommonsRestTestCase
+        MachineLearningInternalClient mlClient = mock(MachineLearningInternalClient.class);
+        injectMlClient(connector, mlClient);
 
-        Map<String, Object> errorFormat2 = Map.of("error", "InvalidRequest");
+        // Wrap mockResponse inside a ModelTensor -> ModelTensors -> ModelTensorOutput -> MLOutput
+        ModelTensor tensor = new ModelTensor("tensor", new Number[0], new long[0], MLResultDataType.STRING, null, null, mockResponse);
+        ModelTensorOutput mlOutput = new ModelTensorOutput(List.of(new ModelTensors(List.of(tensor))));
+        // Do NOT depend on ActionFuture return path; instead drive the async listener directly.
 
-        // Use the same validation style but inverted for errors
-        validateErrorOutput("Should detect error format 1 correctly", errorFormat1, "Unsupported Claude response format");
-        validateErrorOutput("Should detect error format 2 correctly", errorFormat2, "InvalidRequest");
+        // Make asynchronous predict(...) call invoke the ActionListener with our mlOutput
+        doAnswer(invocation -> {
+            @SuppressWarnings("unchecked")
+            ActionListener<MLOutput> listener = (ActionListener<MLOutput>) invocation.getArguments()[2];
+            // Simulate successful ML response
+            listener.onResponse(mlOutput);
+            return null;
+        }).when(mlClient).predict(any(), any(), any());
+
+        // Prepare input (use BEDROCK provider so bedrock branch is taken)
+        ChatCompletionInput input = new ChatCompletionInput(
+            "bedrock/model",
+            "question",
+            Collections.emptyList(),
+            Collections.emptyList(),
+            0,
+            "prompt",
+            "instructions",
+            Llm.ModelProvider.BEDROCK,
+            null,
+            null
+        );
+
+        // Synchronously wait for callback result
+        CountDownLatch latch = new CountDownLatch(1);
+        AtomicReference<Map<String, Object>> resultRef = new AtomicReference<>();
+
+        connector.doChatCompletion(input, new ActionListener<>() {
+            @Override
+            public void onResponse(ChatCompletionOutput output) {
+                Map<String, Object> map = new HashMap<>();
+                map.put("answers", output.getAnswers());
+                map.put("errors", output.getErrors());
+                resultRef.set(map);
+                latch.countDown();
+            }
+
+            @Override
+            public void onFailure(Exception e) {
+                Map<String, Object> map = new HashMap<>();
+                map.put("answers", Collections.emptyList());
+                map.put("errors", List.of(e.getMessage()));
+                resultRef.set(map);
+                latch.countDown();
+            }
+        });
+
+        boolean completed = latch.await(5, TimeUnit.SECONDS);
+        if (!completed) {
+            throw new RuntimeException("Timed out waiting for doChatCompletion callback");
+        }
+        return resultRef.get();
     }
 
     private void validateErrorOutput(String msg, Map<String, Object> output, String expectedError) {
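
Since invokeBedrockInference accepts an arbitrary mock response map, a companion check for the legacy completion-style payload could look like the sketch below. This is illustrative only and not part of this commit; the test name is hypothetical.

    public void testChatCompletionBedrockLegacyCompletionFormat() throws Exception {
        // Legacy Bedrock shape: a flat "completion" string instead of a content list
        Map<String, Object> response = Map.of("completion", "Legacy completion text");

        Map<String, Object> result = invokeBedrockInference(response);

        // The BEDROCK branch should surface the completion string as the single answer
        assertTrue(result.containsKey("answers"));
        assertEquals("Legacy completion text", ((List<?>) result.get("answers")).get(0));
    }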

search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/llm/DefaultLlmImpl.java

Lines changed: 30 additions & 32 deletions
@@ -52,9 +52,9 @@ public class DefaultLlmImpl implements Llm {
     private static final String CONNECTOR_OUTPUT_MESSAGE_ROLE = "role";
     private static final String CONNECTOR_OUTPUT_MESSAGE_CONTENT = "content";
     private static final String CONNECTOR_OUTPUT_ERROR = "error";
-    private static final String CLAUDE_V2_COMPLETION_FIELD = "completion";
-    private static final String CLAUDE_V3_CONTENT_FIELD = "content";
-    private static final String CLAUDE_V3_TEXT_FIELD = "text";
+    private static final String BEDROCK_COMPLETION_FIELD = "completion";
+    private static final String BEDROCK_CONTENT_FIELD = "content";
+    private static final String BEDROCK_TEXT_FIELD = "text";
 
     private final String openSearchModelId;
 
@@ -194,39 +194,37 @@ protected ChatCompletionOutput buildChatCompletionOutput(ModelProvider provider,
                 answers = List.of(message.get(CONNECTOR_OUTPUT_MESSAGE_CONTENT));
             }
         } else if (provider == ModelProvider.BEDROCK) {
-            // Handle both Claude V2 and V3 response formats
-            if (dataAsMap.containsKey(CLAUDE_V2_COMPLETION_FIELD)) {
-                // Old Claude V2 format
-                answerField = CLAUDE_V2_COMPLETION_FIELD;
-                fillAnswersOrErrors(dataAsMap, answers, errors, answerField, errorField, defaultErrorMessageField);
-            } else if (dataAsMap.containsKey(CLAUDE_V3_CONTENT_FIELD)) {
-                // New Claude V3 format
-                Object contentObj = dataAsMap.get(CLAUDE_V3_CONTENT_FIELD);
-                if (contentObj instanceof List) {
-                    List<?> contentList = (List<?>) contentObj;
-                    if (!contentList.isEmpty()) {
-                        Object first = contentList.get(0);
-                        if (first instanceof Map) {
-                            Map<?, ?> firstMap = (Map<?, ?>) first;
-                            Object text = firstMap.get(CLAUDE_V3_TEXT_FIELD);
-                            if (text != null) {
-                                answers.add(text.toString());
-                            } else {
-                                errors.add("Claude V3 response missing '" + CLAUDE_V3_TEXT_FIELD + "' field.");
-                            }
+            // Handle Bedrock model responses (supports both legacy completion and newer content/text formats)
+
+            Object contentObj = dataAsMap.get(BEDROCK_CONTENT_FIELD);
+            if (contentObj == null) {
+                // Legacy completion-style format
+                Object completion = dataAsMap.get(BEDROCK_COMPLETION_FIELD);
+                if (completion != null) {
+                    answers.add(completion.toString());
+                } else {
+                    errors.add("Unsupported Bedrock response format: " + dataAsMap.keySet());
+                    log.error("Unknown Bedrock response format: {}", dataAsMap);
+                }
+            } else {
+                // Fail-fast checks for new content/text format
+                if (!(contentObj instanceof List<?> contentList)) {
+                    errors.add("Unexpected type for '" + BEDROCK_CONTENT_FIELD + "' in Bedrock response.");
+                } else if (contentList.isEmpty()) {
+                    errors.add("Empty content list in Bedrock response.");
+                } else {
+                    Object first = contentList.get(0);
+                    if (!(first instanceof Map<?, ?> firstMap)) {
+                        errors.add("Unexpected content format in Bedrock response.");
+                    } else {
+                        Object text = firstMap.get(BEDROCK_TEXT_FIELD);
+                        if (text == null) {
+                            errors.add("Bedrock content response missing '" + BEDROCK_TEXT_FIELD + "' field.");
                         } else {
-                            errors.add("Unexpected content format in Claude V3 response.");
+                            answers.add(text.toString());
                         }
-                    } else {
-                        errors.add("Empty content list in Claude V3 response.");
                     }
-                } else {
-                    errors.add("Unexpected type for '" + CLAUDE_V3_CONTENT_FIELD + "' in Claude V3 response.");
                 }
-            } else {
-                // Fallback error handling
-                errors.add("Unsupported Claude response format: " + dataAsMap.keySet());
-                log.error("Unknown Bedrock/Claude response format: {}", dataAsMap);
             }
         } else if (provider == ModelProvider.COHERE) {
             answerField = "text";
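
For reference, the payload shapes this branch distinguishes can be summarized as in the minimal sketch below. The holder class name is made up for illustration; the field names come from the constants above.

import java.util.List;
import java.util.Map;

class BedrockResponseShapes {
    // Newer content/text shape: the content branch extracts the "text" value as the answer
    static final Map<String, Object> CONTENT_STYLE =
        Map.of("content", List.of(Map.of("type", "text", "text", "Hello from Bedrock")));

    // Legacy shape: the flat "completion" string becomes the single answer
    static final Map<String, Object> COMPLETION_STYLE =
        Map.of("completion", "Hello from Bedrock");

    // Neither field present: the branch records an "Unsupported Bedrock response format" error
    static final Map<String, Object> UNSUPPORTED =
        Map.of("unexpected_field", "value");
}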

search-processors/src/test/java/org/opensearch/searchpipelines/questionanswering/generative/llm/DefaultLlmImplTests.java

Lines changed: 7 additions & 7 deletions
@@ -143,14 +143,14 @@ public void onFailure(Exception e) {
         assertTrue(mlInput.getInputDataset() instanceof RemoteInferenceInputDataSet);
     }
 
-    public void testChatCompletionApiForBedrockClaudeV3() throws Exception {
+    public void testChatCompletionApiForBedrockContentFormat() throws Exception {
         MachineLearningInternalClient mlClient = mock(MachineLearningInternalClient.class);
         ArgumentCaptor<MLInput> captor = ArgumentCaptor.forClass(MLInput.class);
         DefaultLlmImpl connector = new DefaultLlmImpl("model_id", client);
         connector.setMlClient(mlClient);
 
-        // Claude V3-style response
-        Map<String, Object> textPart = Map.of("type", "text", "text", "Hello from Claude V3");
+        // Bedrock content/text response (newer format)
+        Map<String, Object> textPart = Map.of("type", "text", "text", "Hello from Bedrock");
         Map<String, Object> dataAsMap = Map.of("content", List.of(textPart));
 
         ModelTensor tensor = new ModelTensor("tensor", new Number[0], new long[0], MLResultDataType.STRING, null, null, dataAsMap);
@@ -180,13 +180,13 @@ public void testChatCompletionApiForBedrockClaudeV3() throws Exception {
         connector.doChatCompletion(input, new ActionListener<>() {
             @Override
             public void onResponse(ChatCompletionOutput output) {
-                // Verify that we parsed the Claude V3 response correctly
-                assertEquals("Hello from Claude V3", output.getAnswers().get(0));
+                // Verify that we parsed the Bedrock content response correctly
+                assertEquals("Hello from Bedrock", output.getAnswers().get(0));
             }
 
             @Override
             public void onFailure(Exception e) {
-                fail("Claude V3 test failed: " + e.getMessage());
+                fail("Bedrock test failed: " + e.getMessage());
             }
         });
 
@@ -629,7 +629,7 @@ public void testChatCompletionBedrockThrowingError() throws Exception {
         DefaultLlmImpl connector = new DefaultLlmImpl("model_id", client);
         connector.setMlClient(mlClient);
 
-        String errorMessage = "Unsupported Claude response format";
+        String errorMessage = "Unsupported Bedrock response format";
         Map<String, String> messageMap = Map.of("message", errorMessage);
         Map<String, ?> dataAsMap = Map.of("error", messageMap);
         ModelTensor tensor = new ModelTensor("tensor", new Number[0], new long[0], MLResultDataType.STRING, null, null, dataAsMap);
