Update protobuf/model_config.proto

pskiran1 · yinggeh · web-flow · commit 088152421f3b · 2025-10-31T12:48:26.000+05:30
Co-authored-by: Yingge He <157551214+yinggeh@users.noreply.github.com>
diff --git a/protobuf/model_config.proto b/protobuf/model_config.proto
@@ -1662,8 +1662,8 @@ message ModelEnsembling
 
   //@@  .. cpp:var:: uint32 max_inflight_requests
   //@@
-  //@@     The maximum number of concurrent inflight requests at each ensemble
-  //@@     step.
+  //@@     The maximum number of concurrent inflight requests allowed at
+  //@@     each ensemble step per inference request.
   //@@     This limit prevents unbounded memory growth when decoupled models
   //@@     produce responses faster than downstream models can consume them.
   //@@     Default value is 0, which indicates that no limit is enforced.