We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6d2fd08 commit 1c88766 (Copy full SHA for 1c88766)
tensorflow_serving/apis/predict.proto
@@ -71,6 +71,10 @@ message PredictRequest {
71
// response if the model stops at them. The model may stop at other tokens,
72
// but will not return them in the response.
73
repeated int64 return_stoptokens = 4;
74
+
75
+ // When set and supported by the servable, the model server will cache the
76
+ // prefix of the request up to this length.
77
+ optional int64 max_cache_length = 6;
78
}
79
80
optional RequestOptions request_options = 7;
0 commit comments