|
1 | | -{ |
2 | 1 | "models": [ |
3 | | - { |
| 2 | + { |
4 | 3 | "serviceName": "token_counter_openai", |
5 | 4 | "modelBasePath": "src/token_counter/openai/local/.", |
6 | 5 | "apiBasePath": "token_counter/openai/local/", |
|
9 | 8 | "nginx": [], |
10 | 9 | "build": true |
11 | 10 | }, |
12 | | - { |
| 11 | + { |
13 | 12 | "serviceName": "asr_whisper_en", |
14 | 13 | "modelBasePath": "src/asr/whisper_en/local/.", |
15 | 14 | "apiBasePath": "asr/whisper_en/local/", |
16 | 15 | "containerPort": 8000, |
17 | | - "environment": {}, |
| 16 | + "environment": { |
| 17 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 18 | + }, |
18 | 19 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
19 | 20 | "constraints": ["node.labels.node_vm_type==gpu"], |
20 | 21 | "build": false |
21 | 22 | }, |
22 | | - { |
| 23 | + { |
23 | 24 | "serviceName": "asr_lang_detect", |
24 | 25 | "modelBasePath": "src/asr/whisper_lang_rec/local/.", |
25 | 26 | "apiBasePath": "asr/whisper_lang_rec/local/", |
26 | 27 | "containerPort": 8000, |
27 | | - "environment": {}, |
| 28 | + "environment": { |
| 29 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 30 | + }, |
28 | 31 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
29 | 32 | "constraints": ["node.labels.node_vm_type==gpu"], |
30 | 33 | "build": false |
31 | | - }, |
| 34 | + }, |
32 | 35 | { |
33 | 36 | "serviceName": "ner", |
34 | 37 | "modelBasePath": "src/ner/agri_ner_akai/local/.", |
35 | 38 | "apiBasePath": "ner/agri_ner_akai/local/", |
36 | 39 | "containerPort": 8000, |
37 | | - "environment": {}, |
| 40 | + "environment": { |
| 41 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 42 | + }, |
38 | 43 | "nginx": [], |
| 44 | + "constraints": ["node.labels.node_vm_type==gpu"], |
39 | 45 | "build": false |
40 | 46 | }, |
41 | 47 | { |
|
64 | 70 | "environment": {}, |
65 | 71 | "nginx": [], |
66 | 72 | "constraints": ["node.role==worker"], |
67 | | - "build": false |
| 73 | + "build": true |
68 | 74 | }, |
69 | 75 | { |
70 | 76 | "serviceName": "text_translation_azure_dict", |
|
86 | 92 | "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
87 | 93 | }, |
88 | 94 | "nginx": [], |
89 | | - "constraints": ["node.labels.node_vm_type==gpu"], |
90 | 95 | "build": false |
91 | 96 | }, |
92 | | - { |
93 | | - "serviceName": "text_translation_azure", |
94 | | - "modelBasePath": "src/text_translation/azure/remote/.", |
95 | | - "apiBasePath": "/text_translation/azure/remote", |
96 | | - "containerPort": 8000, |
97 | | - "environment": { |
98 | | - "AZURE_TRANSLATE_KEY": "${AZURE_TRANSLATE_KEY}" |
99 | | - }, |
100 | | - "nginx": [], |
101 | | - "constraints": ["node.labels.node_vm_type==gpu"], |
102 | | - "build": false |
103 | | - }, |
104 | 97 | { |
105 | 98 | "serviceName": "asr_mms", |
106 | 99 | "modelBasePath": "src/asr/fairseq_mms/local/.", |
107 | 100 | "apiBasePath": "/asr/fairseq_mms/local", |
108 | 101 | "containerPort": 8000, |
109 | | - "environment": {}, |
| 102 | + "environment": { |
| 103 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 104 | + }, |
110 | 105 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
111 | 106 | "constraints": ["node.labels.node_vm_type==gpu"], |
112 | 107 | "build": false |
|
116 | 111 | "modelBasePath": "src/coref/fcoref/local/.", |
117 | 112 | "apiBasePath": "/coref/fcoref/local", |
118 | 113 | "containerPort": 8000, |
119 | | - "environment": {}, |
120 | | - "nginx": [], |
121 | | - "constraints": ["node.labels.node_vm_type==gpu"], |
122 | | - "build": false |
123 | | - }, |
124 | | - { |
125 | | - "serviceName": "text_translation_bhashini", |
126 | | - "modelBasePath": "src/text_translation/bhashini/remote/.", |
127 | | - "apiBasePath": "/text_translation/bhashini/remote", |
128 | | - "containerPort": 8000, |
129 | | - "environment": {}, |
| 114 | + "environment": { |
| 115 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
| 116 | + }, |
130 | 117 | "nginx": [], |
131 | 118 | "constraints": ["node.labels.node_vm_type==gpu"], |
132 | 119 | "build": false |
133 | 120 | }, |
134 | | - { |
135 | | - "serviceName": "text_translation_ai4bharat", |
136 | | - "modelBasePath": "src/text_translation/ai4bharat/remote/.", |
137 | | - "apiBasePath": "src/text_translation/ai4bharat/remote", |
138 | | - "containerPort": 8000, |
139 | | - "environment": {}, |
140 | | - "constraints": ["node.labels.node_vm_type==gpu"], |
141 | | - "build": false |
142 | | - }, |
143 | | - { |
144 | | - "serviceName": "text_lang_detection_bhashini", |
145 | | - "modelBasePath": "src/text_lang_detection/bhashini/remote/.", |
146 | | - "apiBasePath": "/text_lang_detection/bhashini/remote", |
147 | | - "containerPort": 8000, |
148 | | - "environment": {}, |
149 | | - "constraints": ["node.labels.node_vm_type==gpu"], |
150 | | - "build": false |
151 | | - }, |
152 | 121 | { |
153 | 122 | "serviceName": "chunking_mpnet", |
154 | 123 | "modelBasePath": "src/chunking/MPNet/local/.", |
155 | 124 | "apiBasePath": "chunking/MPNet/local", |
156 | 125 | "containerPort": 8000, |
157 | 126 | "environment": { |
158 | | - "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
| 127 | + "OPENAI_API_KEY": "${OPENAI_API_KEY}", |
| 128 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
159 | 129 | }, |
160 | 130 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
161 | 131 | "constraints": ["node.labels.node_vm_type==gpu"], |
|
167 | 137 | "apiBasePath": "/embeddings/instructor/local", |
168 | 138 | "containerPort": 8000, |
169 | 139 | "environment": { |
170 | | - "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
| 140 | + "OPENAI_API_KEY": "${OPENAI_API_KEY}", |
| 141 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
171 | 142 | }, |
172 | 143 | "nginx": ["client_max_body_size 100M;", "proxy_read_timeout 600;", "proxy_connect_timeout 600;", "proxy_send_timeout 600;"], |
173 | 144 | "constraints": ["node.labels.node_vm_type==gpu"], |
|
179 | 150 | "apiBasePath": "/llm/openai/chatgpt3", |
180 | 151 | "containerPort": 8000, |
181 | 152 | "environment": { |
182 | | - "OPENAI_API_KEY": "${OPENAI_API_KEY}" |
| 153 | + "OPENAI_API_KEY": "${OPENAI_API_KEY}", |
| 154 | + "NVIDIA_VISIBLE_DEVICES": "${NVIDIA_VISIBLE_DEVICES}" |
183 | 155 | }, |
184 | 156 | "nginx": [], |
185 | 157 | "constraints": ["node.labels.node_vm_type==gpu"], |
|
0 commit comments