Skip to content

Commit b08533e

Browse files
committed
Update field name
1 parent 50bf543 commit b08533e

File tree

1 file changed

+6
-7
lines changed

1 file changed

+6
-7
lines changed

protobuf/model_config.proto

Lines changed: 6 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1660,15 +1660,14 @@ message ModelEnsembling
16601660
//@@
16611661
repeated Step step = 1;
16621662

1663-
//@@ .. cpp:var:: uint32 max_inflight_responses
1663+
//@@ .. cpp:var:: uint32 max_inflight_requests
16641664
//@@
1665-
//@@ The maximum number of concurrent inflight responses from ensemble
1666-
//@@ steps to downstream consumers. This limit prevents unbounded memory
1667-
//@@ growth when decoupled models produce responses faster than downstream
1668-
//@@ models can consume them. Default value is 0, which indicates that no
1669-
//@@ limit is enforced (unlimited).
1665+
//@@ The maximum number of concurrent inflight requests to ensemble steps.
1666+
//@@ This limit prevents unbounded memory growth when decoupled models
1667+
//@@ produce responses faster than downstream models can consume them.
1668+
//@@ Default value is 0, which indicates that no limit is enforced.
16701669
//@@
1671-
uint32 max_inflight_responses = 2;
1670+
uint32 max_inflight_requests = 2;
16721671
}
16731672

16741673
//@@

0 commit comments

Comments
 (0)