|
1 |
| -{ |
2 | 1 | "models": [
|
3 |
| - { |
| 2 | + { |
4 | 3 | "serviceName": "token_counter_openai",
|
5 | 4 | "modelBasePath": "src/token_counter/openai/local/.",
|
6 | 5 | "apiBasePath": "token_counter/openai/local/",
|
|
9 | 8 | "nginx": [],
|
10 | 9 | "build": true
|
11 | 10 | },
|
12 |
| - { |
| 11 | + { |
13 | 12 | "serviceName": "asr_whisper_en",
|
14 | 13 | "modelBasePath": "src/asr/whisper_en/local/.",
|
15 | 14 | "apiBasePath": "asr/whisper_en/local/",
|
16 | 15 | "containerPort": 8000,
|
17 |
| - "environment": {}, |
| 16 | + "environment": { |
| 17 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 18 | + }, |
18 | 19 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"],
|
19 | 20 | "constraints": ["node.labels.node_vm_type==gpu"],
|
20 | 21 | "build": false
|
21 | 22 | },
|
22 |
| - { |
| 23 | + { |
23 | 24 | "serviceName": "asr_lang_detect",
|
24 | 25 | "modelBasePath": "src/asr/whisper_lang_rec/local/.",
|
25 | 26 | "apiBasePath": "asr/whisper_lang_rec/local/",
|
26 | 27 | "containerPort": 8000,
|
27 |
| - "environment": {}, |
| 28 | + "environment": { |
| 29 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 30 | + }, |
28 | 31 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"],
|
29 | 32 | "constraints": ["node.labels.node_vm_type==gpu"],
|
30 | 33 | "build": false
|
31 |
| - }, |
| 34 | + }, |
32 | 35 | {
|
33 | 36 | "serviceName": "ner",
|
34 | 37 | "modelBasePath": "src/ner/agri_ner_akai/local/.",
|
35 | 38 | "apiBasePath": "ner/agri_ner_akai/local/",
|
36 | 39 | "containerPort": 8000,
|
37 |
| - "environment": {}, |
| 40 | + "environment": { |
| 41 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 42 | + }, |
38 | 43 | "nginx": [],
|
| 44 | + "constraints": ["node.labels.node_vm_type==gpu"], |
39 | 45 | "build": false
|
40 | 46 | },
|
41 | 47 | {
|
|
64 | 70 | "environment": {},
|
65 | 71 | "nginx": [],
|
66 | 72 | "constraints": ["node.role==worker"],
|
67 |
| - "build": false |
| 73 | + "build": true |
68 | 74 | },
|
69 | 75 | {
|
70 | 76 | "serviceName": "text_translation_azure_dict",
|
|
86 | 92 | "OPENAI_API_KEY": "${OPENAI_API_KEY}"
|
87 | 93 | },
|
88 | 94 | "nginx": [],
|
89 |
| - "constraints": ["node.labels.node_vm_type==gpu"], |
90 | 95 | "build": false
|
91 | 96 | },
|
92 |
| - { |
93 |
| - "serviceName": "text_translation_azure", |
94 |
| - "modelBasePath": "src/text_translation/azure/remote/.", |
95 |
| - "apiBasePath": "/text_translation/azure/remote", |
96 |
| - "containerPort": 8000, |
97 |
| - "environment": { |
98 |
| - "AZURE_TRANSLATE_KEY": "${AZURE_TRANSLATE_KEY}" |
99 |
| - }, |
100 |
| - "nginx": [], |
101 |
| - "constraints": ["node.labels.node_vm_type==gpu"], |
102 |
| - "build": false |
103 |
| - }, |
104 | 97 | {
|
105 | 98 | "serviceName": "asr_mms",
|
106 | 99 | "modelBasePath": "src/asr/fairseq_mms/local/.",
|
107 | 100 | "apiBasePath": "/asr/fairseq_mms/local",
|
108 | 101 | "containerPort": 8000,
|
109 |
| - "environment": {}, |
| 102 | + "environment": { |
| 103 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 104 | + }, |
110 | 105 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"],
|
111 | 106 | "constraints": ["node.labels.node_vm_type==gpu"],
|
112 | 107 | "build": false
|
|
116 | 111 | "modelBasePath": "src/coref/fcoref/local/.",
|
117 | 112 | "apiBasePath": "/coref/fcoref/local",
|
118 | 113 | "containerPort": 8000,
|
119 |
| - "environment": {}, |
120 |
| - "nginx": [], |
121 |
| - "constraints": ["node.labels.node_vm_type==gpu"], |
122 |
| - "build": false |
123 |
| - }, |
124 |
| - { |
125 |
| - "serviceName": "text_translation_bhashini", |
126 |
| - "modelBasePath": "src/text_translation/bhashini/remote/.", |
127 |
| - "apiBasePath": "/text_translation/bhashini/remote", |
128 |
| - "containerPort": 8000, |
129 |
| - "environment": {}, |
| 114 | + "environment": { |
| 115 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 116 | + }, |
130 | 117 | "nginx": [],
|
131 | 118 | "constraints": ["node.labels.node_vm_type==gpu"],
|
132 | 119 | "build": false
|
133 | 120 | },
|
134 |
| - { |
135 |
| - "serviceName": "text_translation_ai4bharat", |
136 |
| - "modelBasePath": "src/text_translation/ai4bharat/remote/.", |
137 |
| - "apiBasePath": "src/text_translation/ai4bharat/remote", |
138 |
| - "containerPort": 8000, |
139 |
| - "environment": {}, |
140 |
| - "constraints": ["node.labels.node_vm_type==gpu"], |
141 |
| - "build": false |
142 |
| - }, |
143 |
| - { |
144 |
| - "serviceName": "text_lang_detection_bhashini", |
145 |
| - "modelBasePath": "src/text_lang_detection/bhashini/remote/.", |
146 |
| - "apiBasePath": "/text_lang_detection/bhashini/remote", |
147 |
| - "containerPort": 8000, |
148 |
| - "environment": {}, |
149 |
| - "constraints": ["node.labels.node_vm_type==gpu"], |
150 |
| - "build": false |
151 |
| - }, |
152 | 121 | {
|
153 | 122 | "serviceName": "chunking_mpnet",
|
154 | 123 | "modelBasePath": "src/chunking/MPNet/local/.",
|
155 | 124 | "apiBasePath": "chunking/MPNet/local",
|
156 | 125 | "containerPort": 8000,
|
157 | 126 | "environment": {
|
158 |
| - "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
| 127 | + "OPENAI_API_KEY": "${OPENAI_API_KEY}", |
| 128 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
159 | 129 | },
|
160 | 130 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"],
|
161 | 131 | "constraints": ["node.labels.node_vm_type==gpu"],
|
|
167 | 137 | "apiBasePath": "/embeddings/instructor/local",
|
168 | 138 | "containerPort": 8000,
|
169 | 139 | "environment": {
|
170 |
| - "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
| 140 | + "OPENAI_API_KEY": "${OPENAI_API_KEY}", |
| 141 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
171 | 142 | },
|
172 | 143 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"],
|
173 | 144 | "constraints": ["node.labels.node_vm_type==gpu"],
|
|
179 | 150 | "apiBasePath": "/llm/openai/chatgpt3",
|
180 | 151 | "containerPort": 8000,
|
181 | 152 | "environment": {
|
182 |
| - "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
| 153 | + "OPENAI_API_KEY": "${OPENAI_API_KEY}", |
| 154 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
183 | 155 | },
|
184 | 156 | "nginx": [],
|
185 | 157 | "constraints": ["node.labels.node_vm_type==gpu"],
|
|
0 commit comments