Skip to content

Commit c2621e7

Browse files
Refactor Mistral model classes to remove the redundant model field (model ID is now read from service settings) and update rate limit hashing
1 parent 18ee182 commit c2621e7

File tree

5 files changed

+4
-16
lines changed

5 files changed

+4
-16
lines changed

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/LlamaModel.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -61,7 +61,7 @@ public RateLimitSettings rateLimitSettings() {
6161

6262
@Override
6363
public int rateLimitGroupingHash() {
64-
return Objects.hash(uri, getSecretSettings());
64+
return Objects.hash(getServiceSettings().modelId(), uri, getSecretSettings());
6565
}
6666

6767
// Needed for testing only

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/mistral/MistralModel.java

Lines changed: 2 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -16,13 +16,13 @@
1616

1717
import java.net.URI;
1818
import java.net.URISyntaxException;
19+
import java.util.Objects;
1920

2021
/**
2122
* Represents a Mistral model that can be used for inference tasks.
2223
* This class extends RateLimitGroupingModel to handle rate limiting based on model and API key.
2324
*/
2425
public abstract class MistralModel extends RateLimitGroupingModel {
25-
protected String model;
2626
protected URI uri;
2727
protected RateLimitSettings rateLimitSettings;
2828

@@ -34,10 +34,6 @@ protected MistralModel(RateLimitGroupingModel model, ServiceSettings serviceSett
3434
super(model, serviceSettings);
3535
}
3636

37-
public String model() {
38-
return this.model;
39-
}
40-
4137
public URI uri() {
4238
return this.uri;
4339
}
@@ -49,7 +45,7 @@ public RateLimitSettings rateLimitSettings() {
4945

5046
@Override
5147
public int rateLimitGroupingHash() {
52-
return 0;
48+
return Objects.hash(getServiceSettings().modelId(), getSecretSettings().apiKey());
5349
}
5450

5551
// Needed for testing only

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/mistral/completion/MistralChatCompletionModel.java

Lines changed: 0 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,6 @@
2222
import java.net.URI;
2323
import java.net.URISyntaxException;
2424
import java.util.Map;
25-
import java.util.Objects;
2625

2726
import static org.elasticsearch.xpack.inference.services.mistral.MistralConstants.API_COMPLETIONS_PATH;
2827

@@ -102,16 +101,10 @@ public MistralChatCompletionModel(
102101
}
103102

104103
private void setPropertiesFromServiceSettings(MistralChatCompletionServiceSettings serviceSettings) {
105-
this.model = serviceSettings.modelId();
106104
this.rateLimitSettings = serviceSettings.rateLimitSettings();
107105
setEndpointUrl();
108106
}
109107

110-
@Override
111-
public int rateLimitGroupingHash() {
112-
return Objects.hash(model, getSecretSettings().apiKey());
113-
}
114-
115108
private void setEndpointUrl() {
116109
try {
117110
this.uri = new URI(API_COMPLETIONS_PATH);

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/mistral/embeddings/MistralEmbeddingsModel.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -59,7 +59,6 @@ public MistralEmbeddingsModel(MistralEmbeddingsModel model, MistralEmbeddingsSer
5959
}
6060

6161
private void setPropertiesFromServiceSettings(MistralEmbeddingsServiceSettings serviceSettings) {
62-
this.model = serviceSettings.modelId();
6362
this.rateLimitSettings = serviceSettings.rateLimitSettings();
6463
setEndpointUrl();
6564
}

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/mistral/request/embeddings/MistralEmbeddingsRequest.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -42,7 +42,7 @@ public HttpRequest createHttpRequest() {
4242
HttpPost httpPost = new HttpPost(this.uri);
4343

4444
ByteArrayEntity byteEntity = new ByteArrayEntity(
45-
Strings.toString(new MistralEmbeddingsRequestEntity(embeddingsModel.model(), truncationResult.input()))
45+
Strings.toString(new MistralEmbeddingsRequestEntity(embeddingsModel.getServiceSettings().modelId(), truncationResult.input()))
4646
.getBytes(StandardCharsets.UTF_8)
4747
);
4848
httpPost.setEntity(byteEntity);

0 commit comments

Comments
 (0)