|
19 | 19 | import org.elasticsearch.xpack.inference.external.http.sender.Sender; |
20 | 20 | import org.elasticsearch.xpack.inference.external.http.sender.UnifiedChatInput; |
21 | 21 | import org.elasticsearch.xpack.inference.services.ServiceComponents; |
22 | | -import org.elasticsearch.xpack.inference.services.cohere.CohereResponseHandler; |
23 | | -import org.elasticsearch.xpack.inference.services.cohere.response.CohereRankedResponseEntity; |
| 22 | +import org.elasticsearch.xpack.inference.services.jinaai.JinaAIResponseHandler; |
| 23 | +import org.elasticsearch.xpack.inference.services.jinaai.response.JinaAIRerankResponseEntity; |
24 | 24 | import org.elasticsearch.xpack.inference.services.openai.response.OpenAiChatCompletionResponseEntity; |
25 | 25 | import org.elasticsearch.xpack.inference.services.openai.response.OpenAiEmbeddingsResponseEntity; |
26 | 26 | import org.elasticsearch.xpack.inference.services.openshiftai.completion.OpenShiftAiChatCompletionModel; |
@@ -57,11 +57,10 @@ public class OpenShiftAiActionCreator implements OpenShiftAiActionVisitor { |
57 | 57 | "OpenShift AI completion", |
58 | 58 | OpenAiChatCompletionResponseEntity::fromResponse |
59 | 59 | ); |
60 | | - // OpenShift AI Rerank task uses the same response format as Cohere, therefore we can reuse the CohereResponseHandler |
61 | | - private static final ResponseHandler RERANK_HANDLER = new CohereResponseHandler( |
| 60 | + // OpenShift AI Rerank task uses the same response format as JinaAI, therefore we can reuse the JinaAIResponseHandler |
| 61 | + private static final ResponseHandler RERANK_HANDLER = new JinaAIResponseHandler( |
62 | 62 | "OpenShift AI rerank", |
63 | | - (request, response) -> CohereRankedResponseEntity.fromResponse(response), |
64 | | - false |
| 63 | + (request, response) -> JinaAIRerankResponseEntity.fromResponse(response) |
65 | 64 | ); |
66 | 65 |
|
67 | 66 | private final Sender sender; |
@@ -122,11 +121,11 @@ public ExecutableAction create(OpenShiftAiRerankModel model, Map<String, Object> |
122 | 121 | inputs.getChunks(), |
123 | 122 | inputs.getReturnDocuments(), |
124 | 123 | inputs.getTopN(), |
125 | | - model |
| 124 | + overriddenModel |
126 | 125 | ), |
127 | 126 | QueryAndDocsInputs.class |
128 | 127 | ); |
129 | | - var errorMessage = buildErrorMessage(TaskType.RERANK, model.getInferenceEntityId()); |
| 128 | + var errorMessage = buildErrorMessage(TaskType.RERANK, overriddenModel.getInferenceEntityId()); |
130 | 129 | return new SenderExecutableAction(sender, manager, errorMessage); |
131 | 130 | } |
132 | 131 |
|
|
0 commit comments