We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1352a52 · commit 2ece3e4 · Copy full SHA for 2ece3e4
tensorflow_serving/apis/predict.proto
@@ -66,6 +66,10 @@ message PredictRequest {
66
// Only supported in disaggregated serving. When set, additional arrays from
67
// prefill will be returned if available.
68
optional bool return_additional_arrays_from_prefill = 3;
69
+
70
+ // Returns these stop tokens in response if the model stops at them. The
71
+ // model may stop at other tokens, but will not return them in the response.
72
+ repeated int64 return_stoptokens = 4;
73
}
74
75
optional RequestOptions request_options = 7;
0 commit comments