Skip to content

Commit 20eb590

Browse files
authored
[ML] Move request managers into service package (#126114)
1 parent 0360db2 commit 20eb590

File tree

74 files changed

+181
-128
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

74 files changed

+181
-128
lines changed

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/http/sender/BaseRequestManager.java

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515

1616
import static org.elasticsearch.xpack.inference.InferencePlugin.UTILITY_THREAD_POOL_NAME;
1717

18-
abstract class BaseRequestManager implements RequestManager {
18+
public abstract class BaseRequestManager implements RequestManager {
1919
private final ThreadPool threadPool;
2020
private final String inferenceEntityId;
2121
// It's possible that two inference endpoints have the same information defining the group but have different
@@ -24,7 +24,7 @@ abstract class BaseRequestManager implements RequestManager {
2424
private final EndpointGrouping endpointGrouping;
2525
private final RateLimitSettings rateLimitSettings;
2626

27-
BaseRequestManager(ThreadPool threadPool, String inferenceEntityId, Object rateLimitGroup, RateLimitSettings rateLimitSettings) {
27+
public BaseRequestManager(ThreadPool threadPool, String inferenceEntityId, Object rateLimitGroup, RateLimitSettings rateLimitSettings) {
2828
this.threadPool = Objects.requireNonNull(threadPool);
2929
this.inferenceEntityId = Objects.requireNonNull(inferenceEntityId);
3030

@@ -33,7 +33,7 @@ abstract class BaseRequestManager implements RequestManager {
3333
this.rateLimitSettings = rateLimitSettings;
3434
}
3535

36-
BaseRequestManager(ThreadPool threadPool, RateLimitGroupingModel rateLimitGroupingModel) {
36+
public BaseRequestManager(ThreadPool threadPool, RateLimitGroupingModel rateLimitGroupingModel) {
3737
this.threadPool = Objects.requireNonNull(threadPool);
3838
Objects.requireNonNull(rateLimitGroupingModel);
3939

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/http/sender/ExecutableInferenceRequest.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818

1919
import java.util.function.Supplier;
2020

21-
record ExecutableInferenceRequest(
21+
public record ExecutableInferenceRequest(
2222
RequestSender requestSender,
2323
Logger logger,
2424
Request request,

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/http/sender/RequestExecutorService.java

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,7 @@
5555
* attempting to execute a task (aka waiting for the connection manager to lease a connection). See
5656
* {@link org.apache.http.client.config.RequestConfig.Builder#setConnectionRequestTimeout} for more info.
5757
*/
58-
class RequestExecutorService implements RequestExecutor {
58+
public class RequestExecutorService implements RequestExecutor {
5959

6060
/**
6161
* Provides dependency injection mainly for testing
@@ -123,7 +123,7 @@ interface RateLimiterCreator {
123123
private final AtomicReference<Scheduler.Cancellable> cancellableCleanupTask = new AtomicReference<>();
124124
private final AtomicBoolean started = new AtomicBoolean(false);
125125

126-
RequestExecutorService(
126+
public RequestExecutorService(
127127
ThreadPool threadPool,
128128
@Nullable CountDownLatch startupLatch,
129129
RequestExecutorServiceSettings settings,
@@ -141,7 +141,7 @@ interface RateLimiterCreator {
141141
);
142142
}
143143

144-
RequestExecutorService(
144+
public RequestExecutorService(
145145
ThreadPool threadPool,
146146
AdjustableCapacityBlockingQueue.QueueCreator<RejectableTask> queueCreator,
147147
@Nullable CountDownLatch startupLatch,
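x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/http/sender/AlibabaCloudSearchCompletionRequestManager.java → x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/alibabacloudsearch/AlibabaCloudSearchCompletionRequestManager.java

Lines changed: 4 additions & 3 deletions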
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
* 2.0.
66
*/
77

8-
package org.elasticsearch.xpack.inference.external.http.sender;
8+
package org.elasticsearch.xpack.inference.services.alibabacloudsearch;
99

1010
import org.apache.logging.log4j.LogManager;
1111
import org.apache.logging.log4j.Logger;
@@ -14,10 +14,11 @@
1414
import org.elasticsearch.threadpool.ThreadPool;
1515
import org.elasticsearch.xpack.inference.external.http.retry.RequestSender;
1616
import org.elasticsearch.xpack.inference.external.http.retry.ResponseHandler;
17+
import org.elasticsearch.xpack.inference.external.http.sender.ChatCompletionInput;
18+
import org.elasticsearch.xpack.inference.external.http.sender.ExecutableInferenceRequest;
19+
import org.elasticsearch.xpack.inference.external.http.sender.InferenceInputs;
1720
import org.elasticsearch.xpack.inference.external.request.alibabacloudsearch.completion.AlibabaCloudSearchCompletionRequest;
1821
import org.elasticsearch.xpack.inference.external.response.alibabacloudsearch.AlibabaCloudSearchCompletionResponseEntity;
19-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchAccount;
20-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchResponseHandler;
2122
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.completion.AlibabaCloudSearchCompletionModel;
2223

2324
import java.util.List;
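x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/http/sender/AlibabaCloudSearchEmbeddingsRequestManager.java → x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/alibabacloudsearch/AlibabaCloudSearchEmbeddingsRequestManager.java

Lines changed: 4 additions & 3 deletions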
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
* 2.0.
66
*/
77

8-
package org.elasticsearch.xpack.inference.external.http.sender;
8+
package org.elasticsearch.xpack.inference.services.alibabacloudsearch;
99

1010
import org.apache.logging.log4j.LogManager;
1111
import org.apache.logging.log4j.Logger;
@@ -15,10 +15,11 @@
1515
import org.elasticsearch.threadpool.ThreadPool;
1616
import org.elasticsearch.xpack.inference.external.http.retry.RequestSender;
1717
import org.elasticsearch.xpack.inference.external.http.retry.ResponseHandler;
18+
import org.elasticsearch.xpack.inference.external.http.sender.EmbeddingsInput;
19+
import org.elasticsearch.xpack.inference.external.http.sender.ExecutableInferenceRequest;
20+
import org.elasticsearch.xpack.inference.external.http.sender.InferenceInputs;
1821
import org.elasticsearch.xpack.inference.external.request.alibabacloudsearch.AlibabaCloudSearchEmbeddingsRequest;
1922
import org.elasticsearch.xpack.inference.external.response.alibabacloudsearch.AlibabaCloudSearchEmbeddingsResponseEntity;
20-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchAccount;
21-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchResponseHandler;
2223
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.embeddings.AlibabaCloudSearchEmbeddingsModel;
2324

2425
import java.util.List;
Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,10 +5,10 @@
55
* 2.0.
66
*/
77

8-
package org.elasticsearch.xpack.inference.external.http.sender;
8+
package org.elasticsearch.xpack.inference.services.alibabacloudsearch;
99

1010
import org.elasticsearch.threadpool.ThreadPool;
11-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchModel;
11+
import org.elasticsearch.xpack.inference.external.http.sender.BaseRequestManager;
1212

1313
import java.util.Objects;
1414

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
* 2.0.
66
*/
77

8-
package org.elasticsearch.xpack.inference.external.http.sender;
8+
package org.elasticsearch.xpack.inference.services.alibabacloudsearch;
99

1010
import org.apache.logging.log4j.LogManager;
1111
import org.apache.logging.log4j.Logger;
@@ -14,10 +14,11 @@
1414
import org.elasticsearch.threadpool.ThreadPool;
1515
import org.elasticsearch.xpack.inference.external.http.retry.RequestSender;
1616
import org.elasticsearch.xpack.inference.external.http.retry.ResponseHandler;
17+
import org.elasticsearch.xpack.inference.external.http.sender.ExecutableInferenceRequest;
18+
import org.elasticsearch.xpack.inference.external.http.sender.InferenceInputs;
19+
import org.elasticsearch.xpack.inference.external.http.sender.QueryAndDocsInputs;
1720
import org.elasticsearch.xpack.inference.external.request.alibabacloudsearch.AlibabaCloudSearchRerankRequest;
1821
import org.elasticsearch.xpack.inference.external.response.alibabacloudsearch.AlibabaCloudSearchRerankResponseEntity;
19-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchAccount;
20-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchResponseHandler;
2122
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.rerank.AlibabaCloudSearchRerankModel;
2223

2324
import java.util.Objects;
Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
* 2.0.
66
*/
77

8-
package org.elasticsearch.xpack.inference.external.http.sender;
8+
package org.elasticsearch.xpack.inference.services.alibabacloudsearch;
99

1010
import org.apache.logging.log4j.LogManager;
1111
import org.apache.logging.log4j.Logger;
@@ -15,10 +15,11 @@
1515
import org.elasticsearch.threadpool.ThreadPool;
1616
import org.elasticsearch.xpack.inference.external.http.retry.RequestSender;
1717
import org.elasticsearch.xpack.inference.external.http.retry.ResponseHandler;
18+
import org.elasticsearch.xpack.inference.external.http.sender.EmbeddingsInput;
19+
import org.elasticsearch.xpack.inference.external.http.sender.ExecutableInferenceRequest;
20+
import org.elasticsearch.xpack.inference.external.http.sender.InferenceInputs;
1821
import org.elasticsearch.xpack.inference.external.request.alibabacloudsearch.AlibabaCloudSearchSparseRequest;
1922
import org.elasticsearch.xpack.inference.external.response.alibabacloudsearch.AlibabaCloudSearchSparseResponseEntity;
20-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchAccount;
21-
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchResponseHandler;
2223
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.sparse.AlibabaCloudSearchSparseModel;
2324

2425
import java.util.List;

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/alibabacloudsearch/action/AlibabaCloudSearchCompletionAction.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,12 +16,12 @@
1616
import org.elasticsearch.inference.InferenceServiceResults;
1717
import org.elasticsearch.rest.RestStatus;
1818
import org.elasticsearch.xpack.inference.external.action.ExecutableAction;
19-
import org.elasticsearch.xpack.inference.external.http.sender.AlibabaCloudSearchCompletionRequestManager;
2019
import org.elasticsearch.xpack.inference.external.http.sender.ChatCompletionInput;
2120
import org.elasticsearch.xpack.inference.external.http.sender.InferenceInputs;
2221
import org.elasticsearch.xpack.inference.external.http.sender.Sender;
2322
import org.elasticsearch.xpack.inference.services.ServiceComponents;
2423
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchAccount;
24+
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchCompletionRequestManager;
2525
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.completion.AlibabaCloudSearchCompletionModel;
2626

2727
import java.util.Objects;

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/alibabacloudsearch/action/AlibabaCloudSearchEmbeddingsAction.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,11 +12,11 @@
1212
import org.elasticsearch.core.TimeValue;
1313
import org.elasticsearch.inference.InferenceServiceResults;
1414
import org.elasticsearch.xpack.inference.external.action.ExecutableAction;
15-
import org.elasticsearch.xpack.inference.external.http.sender.AlibabaCloudSearchEmbeddingsRequestManager;
1615
import org.elasticsearch.xpack.inference.external.http.sender.InferenceInputs;
1716
import org.elasticsearch.xpack.inference.external.http.sender.Sender;
1817
import org.elasticsearch.xpack.inference.services.ServiceComponents;
1918
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchAccount;
19+
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.AlibabaCloudSearchEmbeddingsRequestManager;
2020
import org.elasticsearch.xpack.inference.services.alibabacloudsearch.embeddings.AlibabaCloudSearchEmbeddingsModel;
2121

2222
import java.util.Objects;

0 commit comments

Comments
 (0)