Skip to content

Commit 08be4c4

Browse files
committed
remove double-counting of inference memory
1 parent 45cf65e commit 08be4c4

File tree

1 file changed

+1
-14
lines changed

1 file changed

+1
-14
lines changed

x-pack/plugin/ml/src/main/java/org/elasticsearch/xpack/ml/inference/assignment/TrainedModelAssignmentRebalancer.java

Lines changed: 1 addition & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -300,9 +300,7 @@ private Map<List<String>, List<AssignmentPlan.Node>> createNodesByZoneMap() {
300300
nodes.add(
301301
new AssignmentPlan.Node(
302302
discoveryNode.getId(),
303-
// We subtract native inference memory as the planner expects available memory for
304-
// native inference including current assignments.
305-
getNodeFreeMemoryExcludingPerNodeOverheadAndNativeInference(load),
303+
load.getFreeMemoryExcludingPerNodeOverhead(),
306304
MlProcessors.get(discoveryNode, allocatedProcessorsScale).roundUp()
307305
)
308306
);
@@ -319,17 +317,6 @@ private Map<List<String>, List<AssignmentPlan.Node>> createNodesByZoneMap() {
319317
}));
320318
}
321319

322-
private static long getNodeFreeMemoryExcludingPerNodeOverheadAndNativeInference(NodeLoad load) {
323-
// load.getFreeMemoryExcludingPerNodeOverhead() = maxMemory - assignedJobMemoryExcludingPerNodeOverhead - 30MB native executable
324-
// code overhead
325-
// assignedJobMemoryExcludingPerNodeOverhead = assignedAnomalyDetectorMemory + assignedDataFrameAnalyticsMemory +
326-
// assignedNativeInferenceMemory
327-
// load.getAssignedNativeInferenceMemory() = assignedNativeInferenceMemory
328-
// TODO: (valeriy) assignedNativeInferenceMemory is double counted in the current calculation.
329-
return load.getFreeMemoryExcludingPerNodeOverhead()/* - load.getAssignedNativeInferenceMemory()*/;
330-
331-
}
332-
333320
private TrainedModelAssignmentMetadata.Builder buildAssignmentsFromPlan(AssignmentPlan assignmentPlan) {
334321
TrainedModelAssignmentMetadata.Builder builder = TrainedModelAssignmentMetadata.Builder.empty();
335322
for (AssignmentPlan.Deployment deployment : assignmentPlan.deployments()) {

0 commit comments

Comments
 (0)