|
22 | 22 | "apiBasePath": "text_classification/flow_classification/local/",
|
23 | 23 | "containerPort": 8000,
|
24 | 24 | "environment": {},
|
25 |
| - "nginx": [] |
| 25 | + "nginx": [], |
| 26 | + "constraints": ["node.role==worker"] |
26 | 27 | },
|
27 | 28 | {
|
28 | 29 | "serviceName": "text_translation_azure_dict",
|
|
42 | 43 | "environment": {
|
43 | 44 | "OPENAI_API_KEY": "${OPENAI_API_KEY}"
|
44 | 45 | },
|
45 |
| - "nginx": [] |
| 46 | + "nginx": [], |
| 47 | + "constraints": ["node.labels.node_vm_type==gpu"] |
46 | 48 | },
|
47 | 49 | {
|
48 | 50 | "serviceName": "coref_spacy",
|
49 | 51 | "modelBasePath": "src/coref/spacy/local/.",
|
50 | 52 | "apiBasePath": "/coref/spacy/local",
|
51 | 53 | "containerPort": 8000,
|
52 | 54 | "environment": {},
|
53 |
| - "nginx": [] |
| 55 | + "nginx": [], |
| 56 | + "constraints": ["node.labels.node_vm_type==gpu"] |
54 | 57 | },
|
55 | 58 | {
|
56 | 59 | "serviceName": "coref_bart",
|
57 | 60 | "modelBasePath": "src/coref/bart/local/.",
|
58 | 61 | "apiBasePath": "/coref/bart/local",
|
59 | 62 | "containerPort": 8000,
|
60 | 63 | "environment": {},
|
61 |
| - "nginx": [] |
| 64 | + "nginx": [], |
| 65 | + "constraints": ["node.labels.node_vm_type==gpu"] |
62 | 66 | },
|
63 | 67 | {
|
64 | 68 | "serviceName": "text_translation_azure",
|
|
68 | 72 | "environment": {
|
69 | 73 | "AZURE_TRANSLATE_KEY": "${AZURE_TRANSLATE_KEY}"
|
70 | 74 | },
|
71 |
| - "nginx": [] |
| 75 | + "nginx": [], |
| 76 | + "constraints": ["node.labels.node_vm_type==gpu"] |
72 | 77 | },
|
73 | 78 | {
|
74 | 79 | "serviceName": "asr_mms",
|
75 | 80 | "modelBasePath": "src/asr/fairseq_mms/local/.",
|
76 | 81 | "apiBasePath": "/asr/fairseq_mms/local",
|
77 | 82 | "containerPort": 8000,
|
78 | 83 | "environment": {},
|
79 |
| - "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"] |
| 84 | + "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
| 85 | + "constraints": ["node.labels.node_vm_type==gpu"] |
80 | 86 | },
|
81 | 87 | {
|
82 | 88 | "serviceName": "coref_fcoref",
|
83 | 89 | "modelBasePath": "src/coref/fcoref/local/.",
|
84 | 90 | "apiBasePath": "/coref/fcoref/local",
|
85 | 91 | "containerPort": 8000,
|
86 | 92 | "environment": {},
|
87 |
| - "nginx": [] |
| 93 | + "nginx": [], |
| 94 | + "constraints": ["node.labels.node_vm_type==gpu"] |
88 | 95 | },
|
89 | 96 | {
|
90 | 97 | "serviceName": "text_translation_bhashini",
|
91 | 98 | "modelBasePath": "src/text_translation/bhashini/remote/.",
|
92 | 99 | "apiBasePath": "/text_translation/bhashini/remote",
|
93 | 100 | "containerPort": 8000,
|
94 | 101 | "environment": {},
|
95 |
| - "nginx": [] |
| 102 | + "nginx": [], |
| 103 | + "constraints": ["node.labels.node_vm_type==gpu"] |
96 | 104 | },
|
97 | 105 | {
|
98 | 106 | "serviceName": "text_translation_ai4bharat",
|
99 | 107 | "modelBasePath": "src/text_translation/ai4bharat/remote/.",
|
100 | 108 | "apiBasePath": "/text_translation/ai4bharat/remote",
|
101 | 109 | "containerPort": 8000,
|
102 |
| - "environment": {} |
| 110 | + "environment": {}, |
| 111 | + "constraints": ["node.labels.node_vm_type==gpu"] |
103 | 112 | },
|
104 | 113 | {
|
105 | 114 | "serviceName": "text_lang_detection_bhashini",
|
106 | 115 | "modelBasePath": "src/text_lang_detection/bhashini/remote/.",
|
107 | 116 | "apiBasePath": "/text_lang_detection/bhashini/remote",
|
108 | 117 | "containerPort": 8000,
|
109 |
| - "environment": {} |
| 118 | + "environment": {}, |
| 119 | + "constraints": ["node.labels.node_vm_type==gpu"] |
110 | 120 | },
|
111 | 121 | {
|
112 | 122 | "serviceName": "chunking_mpnet",
|
|
116 | 126 | "environment": {
|
117 | 127 | "OPENAI_API_KEY": "${OPENAI_API_KEY}"
|
118 | 128 | },
|
119 |
| - "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"] |
| 129 | + "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
| 130 | + "constraints": ["node.labels.node_vm_type==gpu"] |
120 | 131 | },
|
121 | 132 | {
|
122 | 133 | "serviceName": "embedding_instructor",
|
|
126 | 137 | "environment": {
|
127 | 138 | "OPENAI_API_KEY": "${OPENAI_API_KEY}"
|
128 | 139 | },
|
129 |
| - "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"] |
| 140 | + "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
| 141 | + "constraints": ["node.labels.node_vm_type==gpu"] |
130 | 142 | },
|
131 | 143 | {
|
132 | 144 | "serviceName": "llm_openai_gpt3",
|
|
136 | 148 | "environment": {
|
137 | 149 | "OPENAI_API_KEY": "${OPENAI_API_KEY}"
|
138 | 150 | },
|
139 |
| - "nginx": [] |
| 151 | + "nginx": [], |
| 152 | + "constraints": ["node.labels.node_vm_type==gpu"] |
140 | 153 | }
|
141 | 154 | ]
|
142 | 155 | }
|
0 commit comments