# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# * Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
# * Neither the name of NVIDIA CORPORATION nor the names of its
# contributors may be used to endorse or promote products derived
# from this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
# PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
# CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
# EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
# PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
# OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

# Ensemble model configuration with a single step: the ensemble's
# "text_input" tensor is passed to the composing model "vllm_opt", and that
# model's "text_output" tensor is returned as the ensemble's "text_output".
name: "ensemble_model"
platform: "ensemble"
max_batch_size: 1

# Tensor accepted by the ensemble: strings, one variable-length dimension.
input [
  {
    name: "text_input"
    data_type: TYPE_STRING
    dims: [ -1 ]
  }
]

# Tensor produced by the ensemble: strings, one variable-length dimension.
output [
  {
    name: "text_output"
    data_type: TYPE_STRING
    dims: [ -1 ]
  }
]

ensemble_scheduling {
  step [
    {
      model_name: "vllm_opt"
      # -1 selects the latest available version of the composing model.
      model_version: -1
      # key   = input tensor name on the composing model,
      # value = ensemble tensor that feeds it.
      input_map {
        key: "text_input"
        value: "text_input"
      }
      # key   = output tensor name on the composing model,
      # value = ensemble tensor that receives it.
      output_map {
        key: "text_output"
        value: "text_output"
      }
    }
  ]
}