Skip to content

Commit fe6173e

Browse files
Refactor Llama model classes to remove modelId and update embedding request handling
1 parent: e06653b · commit: fe6173e

File tree

4 files changed, with 3 additions and 9 deletions.

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/LlamaModel.java

Lines changed: 1 addition & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,6 @@
2828
* This class extends RateLimitGroupingModel and provides common functionality for Llama models.
2929
*/
3030
public abstract class LlamaModel extends RateLimitGroupingModel {
31-
protected String modelId;
3231
protected URI uri;
3332
protected RateLimitSettings rateLimitSettings;
3433

@@ -51,10 +50,6 @@ protected LlamaModel(RateLimitGroupingModel model, ServiceSettings serviceSettin
5150
super(model, serviceSettings);
5251
}
5352

54-
public String model() {
55-
return this.modelId;
56-
}
57-
5853
public URI uri() {
5954
return this.uri;
6055
}
@@ -66,7 +61,7 @@ public RateLimitSettings rateLimitSettings() {
6661

6762
@Override
6863
public int rateLimitGroupingHash() {
69-
return Objects.hash(modelId, uri, getSecretSettings());
64+
return Objects.hash(uri, getSecretSettings());
7065
}
7166

7267
// Needed for testing only

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/completion/LlamaChatCompletionModel.java

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -105,7 +105,6 @@ public static LlamaChatCompletionModel of(LlamaChatCompletionModel model, Unifie
105105
}
106106

107107
private void setPropertiesFromServiceSettings(LlamaChatCompletionServiceSettings serviceSettings) {
108-
this.modelId = serviceSettings.modelId();
109108
this.uri = serviceSettings.uri();
110109
this.rateLimitSettings = serviceSettings.rateLimitSettings();
111110
}

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/embeddings/LlamaEmbeddingsModel.java

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,6 @@ public LlamaEmbeddingsModel(LlamaEmbeddingsModel model, LlamaEmbeddingsServiceSe
7575
* @param serviceSettings the service settings to extract properties from
7676
*/
7777
private void setPropertiesFromServiceSettings(LlamaEmbeddingsServiceSettings serviceSettings) {
78-
this.modelId = serviceSettings.modelId();
7978
this.uri = serviceSettings.uri();
8079
this.rateLimitSettings = serviceSettings.rateLimitSettings();
8180
}

x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/request/embeddings/LlamaEmbeddingsRequest.java

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -60,7 +60,8 @@ public HttpRequest createHttpRequest() {
6060
HttpPost httpPost = new HttpPost(this.uri);
6161

6262
ByteArrayEntity byteEntity = new ByteArrayEntity(
63-
Strings.toString(new LlamaEmbeddingsRequestEntity(model.model(), truncationResult.input())).getBytes(StandardCharsets.UTF_8)
63+
Strings.toString(new LlamaEmbeddingsRequestEntity(model.getServiceSettings().modelId(), truncationResult.input()))
64+
.getBytes(StandardCharsets.UTF_8)
6465
);
6566
httpPost.setEntity(byteEntity);
6667

0 commit comments

Comments
 (0)