junweid62
diff --git a/plugin/src/test/java/org/opensearch/ml/rest/RestMLRAGSearchProcessorIT.java b/plugin/src/test/java/org/opensearch/ml/rest/RestMLRAGSearchProcessorIT.java
Lines changed: 174 additions & 3 deletions
diff --git a/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/GenerativeQAResponseProcessor.java b/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/GenerativeQAResponseProcessor.java
Lines changed: 2 additions & 1 deletion
diff --git a/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/ext/GenerativeQAParameters.java b/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/ext/GenerativeQAParameters.java
Lines changed: 20 additions & 3 deletions
diff --git a/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/llm/ChatCompletionInput.java b/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/llm/ChatCompletionInput.java
Lines changed: 1 addition & 0 deletions
diff --git a/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/llm/ChatCompletionOutput.java b/search-processors/src/main/java/org/opensearch/searchpipelines/questionanswering/generative/llm/ChatCompletionOutput.java
Lines changed: 4 additions & 9 deletions
@@ -34,6 +34,7 @@
 import org.opensearch.core.rest.RestStatus;
 import org.opensearch.ml.common.MLTaskState;
 import org.opensearch.ml.utils.TestHelper;
+import org.opensearch.searchpipelines.questionanswering.generative.llm.LlmIOUtil;
 
 import com.google.common.collect.ImmutableList;
 import com.google.common.collect.ImmutableMap;
@@ -147,6 +148,35 @@ public class RestMLRAGSearchProcessorIT extends RestMLRemoteInferenceIT {
     private static final String BEDROCK_CONNECTOR_BLUEPRINT = AWS_SESSION_TOKEN == null
         ? BEDROCK_CONNECTOR_BLUEPRINT2
         : BEDROCK_CONNECTOR_BLUEPRINT1;
+
+    private static final String COHERE_API_KEY = System.getenv("COHERE_API_KEY"); // null when the environment variable is unset
+    private static final String COHERE_CONNECTOR_BLUEPRINT = "{\n" // JSON connector definition that the Cohere tests pass to createConnector(...)
+        + "    \"name\": \"Cohere Chat Model\",\n"
+        + "    \"description\": \"The connector to Cohere's public chat API\",\n"
+        + "    \"version\": \"1\",\n"
+        + "    \"protocol\": \"http\",\n"
+        + "    \"credential\": {\n"
+        + "        \"cohere_key\": \""
+        + COHERE_API_KEY // concatenated verbatim; becomes the literal text "null" when the key is unset
+        + "\"\n"
+        + "    },\n"
+        + "    \"parameters\": {\n"
+        + "        \"model\": \"command\"\n" // model name referenced as ${parameters.model} in request_body below
+        + "    },\n"
+        + "    \"actions\": [\n"
+        + "        {\n"
+        + "            \"action_type\": \"predict\",\n"
+        + "            \"method\": \"POST\",\n"
+        + "            \"url\": \"https://api.cohere.ai/v1/chat\",\n"
+        + "            \"headers\": {\n"
+        + "                \"Authorization\": \"Bearer ${credential.cohere_key}\",\n" // refers to the cohere_key entry of the credential object above
+        + "                \"Request-Source\": \"unspecified:opensearch\"\n"
+        + "            },\n"
+        + "            \"request_body\": \"{ \\\"message\\\": \\\"${parameters.inputs}\\\", \\\"model\\\": \\\"${parameters.model}\\\" }\" \n" // body fields: message from ${parameters.inputs}, model from ${parameters.model}
+        + "        }\n"
+        + "    ]\n"
+        + "}";
+
     private static final String PIPELINE_TEMPLATE = "{\n"
         + "  \"response_processors\": [\n"
         + "    {\n"
@@ -199,6 +229,23 @@ public class RestMLRAGSearchProcessorIT extends RestMLRemoteInferenceIT {
         + "  }\n"
         + "}";
 
+    private static final String BM25_SEARCH_REQUEST_WITH_LLM_RESPONSE_FIELD_TEMPLATE = "{\n" // match-query search body with an llm_response_field; takes 9 format arguments, numbered below
+        + "  \"_source\": [\"%s\"],\n" // arg 1 (%s): field returned in _source
+        + "  \"query\" : {\n"
+        + "    \"match\": {\"%s\": \"%s\"}\n" // arg 2 (%s): field to match on; arg 3 (%s): text to match
+        + "  },\n"
+        + "   \"ext\": {\n"
+        + "      \"generative_qa_parameters\": {\n"
+        + "        \"llm_model\": \"%s\",\n" // arg 4 (%s)
+        + "        \"llm_question\": \"%s\",\n" // arg 5 (%s)
+        + "        \"context_size\": %d,\n" // arg 6 (%d)
+        + "        \"message_size\": %d,\n" // arg 7 (%d)
+        + "        \"timeout\": %d,\n" // arg 8 (%d)
+        + "        \"llm_response_field\": \"%s\"\n" // arg 9 (%s)
+        + "      }\n"
+        + "  }\n"
+        + "}"; // NOTE(review): no system_prompt/user_instructions placeholders here, yet performSearch appears to still pass userInstructions when formatting this template - verify the argument list lines up
+
     private static final String OPENAI_MODEL = "gpt-3.5-turbo";
     private static final String BEDROCK_ANTHROPIC_CLAUDE = "bedrock/anthropic-claude";
     private static final String TEST_DOC_PATH = "org/opensearch/ml/rest/test_data/";
@@ -472,6 +519,111 @@ public void testBM25WithBedrockWithConversation() throws Exception {
         assertNotNull(interactionId);
     }
 
+    public void testBM25WithCohere() throws Exception { // RAG search through a search pipeline backed by a Cohere remote model
+        // Skip the test when the COHERE_API_KEY environment variable is not set; returning here lets it pass as a no-op.
+        if (COHERE_API_KEY == null) {
+            return;
+        }
+        Response response = createConnector(COHERE_CONNECTOR_BLUEPRINT); // step 1: create the connector from the Cohere blueprint
+        Map responseMap = parseResponseToMap(response);
+        String connectorId = (String) responseMap.get("connector_id");
+        response = registerRemoteModel("Cohere Chat Completion v1", connectorId); // step 2: register a remote model on that connector
+        responseMap = parseResponseToMap(response);
+        String taskId = (String) responseMap.get("task_id");
+        waitForTask(taskId, MLTaskState.COMPLETED); // wait on the register task, then fetch it below to read its model_id
+        response = getTask(taskId);
+        responseMap = parseResponseToMap(response);
+        String modelId = (String) responseMap.get("model_id");
+        response = deployRemoteModel(modelId); // step 3: deploy the registered model
+        responseMap = parseResponseToMap(response);
+        taskId = (String) responseMap.get("task_id");
+        waitForTask(taskId, MLTaskState.COMPLETED); // wait on the deploy task
+
+        PipelineParameters pipelineParameters = new PipelineParameters();
+        pipelineParameters.tag = "testBM25WithCohere";
+        pipelineParameters.description = "desc";
+        pipelineParameters.modelId = modelId;
+        pipelineParameters.systemPrompt = "You are a helpful assistant";
+        pipelineParameters.userInstructions = "none";
+        pipelineParameters.context_field = "text";
+        Response response1 = createSearchPipeline("pipeline_test", pipelineParameters); // step 4: create the search pipeline that uses the deployed model
+        assertEquals(200, response1.getStatusLine().getStatusCode());
+
+        SearchRequestParameters requestParameters = new SearchRequestParameters();
+        requestParameters.source = "text";
+        requestParameters.match = "president";
+        requestParameters.llmModel = LlmIOUtil.COHERE_PROVIDER_PREFIX + "command"; // provider prefix + model name; presumably how the processor recognizes Cohere - confirm in LlmIOUtil
+        requestParameters.llmQuestion = "who is lincoln";
+        requestParameters.contextSize = 5;
+        requestParameters.interactionSize = 5;
+        requestParameters.timeout = 60;
+        Response response2 = performSearch(INDEX_NAME, "pipeline_test", 5, requestParameters); // step 5: search through the pipeline
+        assertEquals(200, response2.getStatusLine().getStatusCode());
+
+        Map responseMap2 = parseResponseToMap(response2);
+        Map ext = (Map) responseMap2.get("ext");
+        assertNotNull(ext);
+        Map rag = (Map) ext.get("retrieval_augmented_generation"); // section of the search response "ext" that holds the generated answer
+        assertNotNull(rag);
+
+        // TODO handle errors such as throttling; for now only the presence of an answer is asserted.
+        String answer = (String) rag.get("answer");
+        assertNotNull(answer);
+    }
+
+    public void testBM25WithCohereUsingLlmResponseField() throws Exception { // same Cohere flow, but the search request sets llm_response_field
+        // Skip the test when the COHERE_API_KEY environment variable is not set; returning here lets it pass as a no-op.
+        if (COHERE_API_KEY == null) {
+            return;
+        }
+        Response response = createConnector(COHERE_CONNECTOR_BLUEPRINT); // step 1: create the connector from the Cohere blueprint
+        Map responseMap = parseResponseToMap(response);
+        String connectorId = (String) responseMap.get("connector_id");
+        response = registerRemoteModel("Cohere Chat Completion v1", connectorId); // step 2: register a remote model on that connector
+        responseMap = parseResponseToMap(response);
+        String taskId = (String) responseMap.get("task_id");
+        waitForTask(taskId, MLTaskState.COMPLETED); // wait on the register task, then fetch it below to read its model_id
+        response = getTask(taskId);
+        responseMap = parseResponseToMap(response);
+        String modelId = (String) responseMap.get("model_id");
+        response = deployRemoteModel(modelId); // step 3: deploy the registered model
+        responseMap = parseResponseToMap(response);
+        taskId = (String) responseMap.get("task_id");
+        waitForTask(taskId, MLTaskState.COMPLETED); // wait on the deploy task
+
+        PipelineParameters pipelineParameters = new PipelineParameters();
+        pipelineParameters.tag = "testBM25WithCohereLlmResponseField";
+        pipelineParameters.description = "desc";
+        pipelineParameters.modelId = modelId;
+        pipelineParameters.systemPrompt = "You are a helpful assistant";
+        pipelineParameters.userInstructions = "none";
+        pipelineParameters.context_field = "text";
+        Response response1 = createSearchPipeline("pipeline_test", pipelineParameters); // step 4: create the search pipeline that uses the deployed model
+        assertEquals(200, response1.getStatusLine().getStatusCode());
+
+        SearchRequestParameters requestParameters = new SearchRequestParameters();
+        requestParameters.source = "text";
+        requestParameters.match = "president";
+        requestParameters.llmModel = "command"; // bare model name, no provider prefix (unlike testBM25WithCohere)
+        requestParameters.llmQuestion = "who is lincoln";
+        requestParameters.contextSize = 5;
+        requestParameters.interactionSize = 5;
+        requestParameters.timeout = 60;
+        requestParameters.llmResponseField = "text"; // non-null value makes performSearch use the llm_response_field request template; presumably names the text field of Cohere's chat response - confirm
+        Response response2 = performSearch(INDEX_NAME, "pipeline_test", 5, requestParameters); // step 5: search through the pipeline
+        assertEquals(200, response2.getStatusLine().getStatusCode());
+
+        Map responseMap2 = parseResponseToMap(response2);
+        Map ext = (Map) responseMap2.get("ext");
+        assertNotNull(ext);
+        Map rag = (Map) ext.get("retrieval_augmented_generation"); // section of the search response "ext" that holds the generated answer
+        assertNotNull(rag);
+
+        // TODO handle errors such as throttling; for now only the presence of an answer is asserted.
+        String answer = (String) rag.get("answer");
+        assertNotNull(answer);
+    }
+
     private Response createSearchPipeline(String pipeline, PipelineParameters parameters) throws Exception {
         return makeRequest(
             client(),
@@ -498,11 +650,11 @@ private Response createSearchPipeline(String pipeline, PipelineParameters parame
     private Response performSearch(String indexName, String pipeline, int size, SearchRequestParameters requestParameters)
         throws Exception {
 
-        String httpEntity = (requestParameters.conversationId == null)
+        String httpEntity = requestParameters.llmResponseField != null
             ? String
                 .format(
                     Locale.ROOT,
-                    BM25_SEARCH_REQUEST_TEMPLATE,
+                    BM25_SEARCH_REQUEST_WITH_LLM_RESPONSE_FIELD_TEMPLATE,
                     requestParameters.source,
                     requestParameters.source,
                     requestParameters.match,
@@ -512,8 +664,25 @@ private Response performSearch(String indexName, String pipeline, int size, Sear
                     requestParameters.userInstructions,
                     requestParameters.contextSize,
                     requestParameters.interactionSize,
-                    requestParameters.timeout
+                    requestParameters.timeout,
+                    requestParameters.llmResponseField
                 )
+            : (requestParameters.conversationId == null)
+                ? String
+                    .format(
+                        Locale.ROOT,
+                        BM25_SEARCH_REQUEST_TEMPLATE,
+                        requestParameters.source,
+                        requestParameters.source,
+                        requestParameters.match,
+                        requestParameters.llmModel,
+                        requestParameters.llmQuestion,
+                        requestParameters.systemPrompt,
+                        requestParameters.userInstructions,
+                        requestParameters.contextSize,
+                        requestParameters.interactionSize,
+                        requestParameters.timeout
+                    )
             : String
                 .format(
                     Locale.ROOT,
@@ -572,5 +741,7 @@ static class SearchRequestParameters {
         int interactionSize;
         int timeout;
         String conversationId;
+
+        String llmResponseField;
     }
 }
@@ -165,7 +165,8 @@ public SearchResponse processResponse(SearchRequest request, SearchResponse resp
                             llmQuestion,
                             chatHistory,
                             searchResults,
-                            timeout
+                            timeout,
+                            params.getLlmResponseField()
                         )
                 );
             log.info("doChatCompletion complete. ({})", getDuration(start));
 
@@ -71,10 +71,16 @@ public class GenerativeQAParameters implements Writeable, ToXContentObject {
     // from a remote inference endpoint before timing out the request.
     private static final ParseField TIMEOUT = new ParseField("timeout");
 
+    // Optional parameter: this parameter allows request-level customization of the "system" (role) prompt.
     private static final ParseField SYSTEM_PROMPT = new ParseField(GenerativeQAProcessorConstants.CONFIG_NAME_SYSTEM_PROMPT);
 
+    // Optional parameter: this parameter allows request-level customization of the "user" (role) prompt.
     private static final ParseField USER_INSTRUCTIONS = new ParseField(GenerativeQAProcessorConstants.CONFIG_NAME_USER_INSTRUCTIONS);
 
+    // Optional parameter: this parameter indicates the name of the field in the LLM response
+    // that contains the chat completion text, i.e. "answer".
+    private static final ParseField LLM_RESPONSE_FIELD = new ParseField("llm_response_field");
+
     public static final int SIZE_NULL_VALUE = -1;
 
     static {
@@ -87,6 +93,7 @@ public class GenerativeQAParameters implements Writeable, ToXContentObject {
         PARSER.declareIntOrNull(GenerativeQAParameters::setContextSize, SIZE_NULL_VALUE, CONTEXT_SIZE);
         PARSER.declareIntOrNull(GenerativeQAParameters::setInteractionSize, SIZE_NULL_VALUE, INTERACTION_SIZE);
         PARSER.declareIntOrNull(GenerativeQAParameters::setTimeout, SIZE_NULL_VALUE, TIMEOUT);
+        PARSER.declareStringOrNull(GenerativeQAParameters::setLlmResponseField, LLM_RESPONSE_FIELD);
     }
 
     @Setter
@@ -121,6 +128,10 @@ public class GenerativeQAParameters implements Writeable, ToXContentObject {
     @Getter
     private String userInstructions;
 
+    @Setter
+    @Getter
+    private String llmResponseField;
+
     public GenerativeQAParameters(
         String conversationId,
         String llmModel,
@@ -129,7 +140,8 @@ public GenerativeQAParameters(
         String userInstructions,
         Integer contextSize,
         Integer interactionSize,
-        Integer timeout
+        Integer timeout,
+        String llmResponseField
     ) {
         this.conversationId = conversationId;
         this.llmModel = llmModel;
@@ -143,6 +155,7 @@ public GenerativeQAParameters(
         this.contextSize = (contextSize == null) ? SIZE_NULL_VALUE : contextSize;
         this.interactionSize = (interactionSize == null) ? SIZE_NULL_VALUE : interactionSize;
         this.timeout = (timeout == null) ? SIZE_NULL_VALUE : timeout;
+        this.llmResponseField = llmResponseField;
     }
 
     public GenerativeQAParameters(StreamInput input) throws IOException {
@@ -154,6 +167,7 @@ public GenerativeQAParameters(StreamInput input) throws IOException {
         this.contextSize = input.readInt();
         this.interactionSize = input.readInt();
         this.timeout = input.readInt();
+        this.llmResponseField = input.readOptionalString();
     }
 
     @Override
@@ -166,7 +180,8 @@ public XContentBuilder toXContent(XContentBuilder xContentBuilder, Params params
             .field(USER_INSTRUCTIONS.getPreferredName(), this.userInstructions)
             .field(CONTEXT_SIZE.getPreferredName(), this.contextSize)
             .field(INTERACTION_SIZE.getPreferredName(), this.interactionSize)
-            .field(TIMEOUT.getPreferredName(), this.timeout);
+            .field(TIMEOUT.getPreferredName(), this.timeout)
+            .field(LLM_RESPONSE_FIELD.getPreferredName(), this.llmResponseField);
     }
 
     @Override
@@ -181,6 +196,7 @@ public void writeTo(StreamOutput out) throws IOException {
         out.writeInt(contextSize);
         out.writeInt(interactionSize);
         out.writeInt(timeout);
+        out.writeOptionalString(llmResponseField);
     }
 
     public static GenerativeQAParameters parse(XContentParser parser) throws IOException {
@@ -204,6 +220,7 @@ public boolean equals(Object o) {
             && Objects.equals(this.userInstructions, other.getUserInstructions())
             && (this.contextSize == other.getContextSize())
             && (this.interactionSize == other.getInteractionSize())
-            && (this.timeout == other.getTimeout());
+            && (this.timeout == other.getTimeout())
+            && Objects.equals(this.llmResponseField, other.getLlmResponseField());
     }
 }
@@ -43,4 +43,5 @@ public class ChatCompletionInput {
     private String systemPrompt;
     private String userInstructions;
     private Llm.ModelProvider modelProvider;
+    private String llmResponseField;
 }
@@ -19,6 +19,8 @@
 
 import java.util.List;
 
+import org.opensearch.core.common.util.CollectionUtils;
+
 import lombok.Getter;
 import lombok.Setter;
 import lombok.extern.log4j.Log4j2;
@@ -38,19 +40,12 @@ public class ChatCompletionOutput {
 
     public ChatCompletionOutput(List<Object> answers, List<String> errors) {
 
-        if (answers == null && errors == null) {
+        if (CollectionUtils.isEmpty(answers) && CollectionUtils.isEmpty(errors)) {
             throw new IllegalArgumentException("answers and errors can't both be null.");
         }
 
-        if (answers == null) {
-            if (errors.isEmpty()) {
-                throw new IllegalArgumentException("If answers is not provided, one or more errors must be provided.");
-            }
+        if (CollectionUtils.isEmpty(answers)) {
             this.errorOccurred = true;
-        } else if (errors == null) {
-            if (answers.isEmpty()) {
-                throw new IllegalArgumentException("If errors is not provided, one or more answers must be provided.");
-            }
         }
 
         this.answers = answers;
Original file line number	Diff line number	Diff line change
`@@ -43,4 +43,5 @@ public class ChatCompletionInput {`
`43`	`43`	`private String systemPrompt;`
`44`	`44`	`private String userInstructions;`
`45`	`45`	`private Llm.ModelProvider modelProvider;`
	`46`	`+ private String llmResponseField;`
`46`	`47`	`}`