/ mlflow / utils / model_catalog / ovhcloud.json
ovhcloud.json
  1  {
  2    "schema_version": "1.0",
  3    "models": {
  4      "DeepSeek-R1-Distill-Llama-70B": {
  5        "mode": "chat",
  6        "context_window": {
  7          "max_input": 131000,
  8          "max_output": 131000,
  9          "max_tokens": 131000
 10        },
 11        "pricing": {
 12          "input_per_million_tokens": 0.67,
 13          "output_per_million_tokens": 0.67
 14        },
 15        "capabilities": {
 16          "function_calling": true,
 17          "vision": false,
 18          "reasoning": true,
 19          "prompt_caching": false,
 20          "response_schema": true
 21        },
 22        "last_updated_at": "2026-04-24"
 23      },
 24      "Llama-3.1-8B-Instruct": {
 25        "mode": "chat",
 26        "context_window": {
 27          "max_input": 131000,
 28          "max_output": 131000,
 29          "max_tokens": 131000
 30        },
 31        "pricing": {
 32          "input_per_million_tokens": 0.1,
 33          "output_per_million_tokens": 0.1
 34        },
 35        "capabilities": {
 36          "function_calling": true,
 37          "vision": false,
 38          "reasoning": false,
 39          "prompt_caching": false,
 40          "response_schema": true
 41        },
 42        "last_updated_at": "2026-04-24"
 43      },
 44      "Meta-Llama-3_1-70B-Instruct": {
 45        "mode": "chat",
 46        "context_window": {
 47          "max_input": 131000,
 48          "max_output": 131000,
 49          "max_tokens": 131000
 50        },
 51        "pricing": {
 52          "input_per_million_tokens": 0.67,
 53          "output_per_million_tokens": 0.67
 54        },
 55        "capabilities": {
 56          "function_calling": false,
 57          "vision": false,
 58          "reasoning": false,
 59          "prompt_caching": false,
 60          "response_schema": false
 61        },
 62        "last_updated_at": "2026-04-24"
 63      },
 64      "Meta-Llama-3_3-70B-Instruct": {
 65        "mode": "chat",
 66        "context_window": {
 67          "max_input": 131000,
 68          "max_output": 131000,
 69          "max_tokens": 131000
 70        },
 71        "pricing": {
 72          "input_per_million_tokens": 0.67,
 73          "output_per_million_tokens": 0.67
 74        },
 75        "capabilities": {
 76          "function_calling": true,
 77          "vision": false,
 78          "reasoning": false,
 79          "prompt_caching": false,
 80          "response_schema": true
 81        },
 82        "last_updated_at": "2026-04-24"
 83      },
 84      "Mistral-7B-Instruct-v0.3": {
 85        "mode": "chat",
 86        "context_window": {
 87          "max_input": 127000,
 88          "max_output": 127000,
 89          "max_tokens": 127000
 90        },
 91        "pricing": {
 92          "input_per_million_tokens": 0.1,
 93          "output_per_million_tokens": 0.1
 94        },
 95        "capabilities": {
 96          "function_calling": true,
 97          "vision": false,
 98          "reasoning": false,
 99          "prompt_caching": false,
100          "response_schema": true
101        },
102        "last_updated_at": "2026-04-24"
103      },
104      "Mistral-Nemo-Instruct-2407": {
105        "mode": "chat",
106        "context_window": {
107          "max_input": 118000,
108          "max_output": 118000,
109          "max_tokens": 118000
110        },
111        "pricing": {
112          "input_per_million_tokens": 0.13,
113          "output_per_million_tokens": 0.13
114        },
115        "capabilities": {
116          "function_calling": true,
117          "vision": false,
118          "reasoning": false,
119          "prompt_caching": false,
120          "response_schema": true
121        },
122        "last_updated_at": "2026-04-24"
123      },
124      "Mistral-Small-3.2-24B-Instruct-2506": {
125        "mode": "chat",
126        "context_window": {
127          "max_input": 128000,
128          "max_output": 128000,
129          "max_tokens": 128000
130        },
131        "pricing": {
132          "input_per_million_tokens": 0.09,
133          "output_per_million_tokens": 0.28
134        },
135        "capabilities": {
136          "function_calling": true,
137          "vision": true,
138          "reasoning": false,
139          "prompt_caching": false,
140          "response_schema": true
141        },
142        "last_updated_at": "2026-04-24"
143      },
144      "Mixtral-8x7B-Instruct-v0.1": {
145        "mode": "chat",
146        "context_window": {
147          "max_input": 32000,
148          "max_output": 32000,
149          "max_tokens": 32000
150        },
151        "pricing": {
152          "input_per_million_tokens": 0.63,
153          "output_per_million_tokens": 0.63
154        },
155        "capabilities": {
156          "function_calling": false,
157          "vision": false,
158          "reasoning": false,
159          "prompt_caching": false,
160          "response_schema": true
161        },
162        "last_updated_at": "2026-04-24"
163      },
164      "Qwen2.5-Coder-32B-Instruct": {
165        "mode": "chat",
166        "context_window": {
167          "max_input": 32000,
168          "max_output": 32000,
169          "max_tokens": 32000
170        },
171        "pricing": {
172          "input_per_million_tokens": 0.87,
173          "output_per_million_tokens": 0.87
174        },
175        "capabilities": {
176          "function_calling": false,
177          "vision": false,
178          "reasoning": false,
179          "prompt_caching": false,
180          "response_schema": true
181        },
182        "last_updated_at": "2026-04-24"
183      },
184      "Qwen2.5-VL-72B-Instruct": {
185        "mode": "chat",
186        "context_window": {
187          "max_input": 32000,
188          "max_output": 32000,
189          "max_tokens": 32000
190        },
191        "pricing": {
192          "input_per_million_tokens": 0.91,
193          "output_per_million_tokens": 0.91
194        },
195        "capabilities": {
196          "function_calling": false,
197          "vision": true,
198          "reasoning": false,
199          "prompt_caching": false,
200          "response_schema": true
201        },
202        "last_updated_at": "2026-04-24"
203      },
204      "Qwen3-32B": {
205        "mode": "chat",
206        "context_window": {
207          "max_input": 32000,
208          "max_output": 32000,
209          "max_tokens": 32000
210        },
211        "pricing": {
212          "input_per_million_tokens": 0.08,
213          "output_per_million_tokens": 0.23
214        },
215        "capabilities": {
216          "function_calling": true,
217          "vision": false,
218          "reasoning": true,
219          "prompt_caching": false,
220          "response_schema": true
221        },
222        "last_updated_at": "2026-04-24"
223      },
224      "gpt-oss-120b": {
225        "mode": "chat",
226        "context_window": {
227          "max_input": 131000,
228          "max_output": 131000,
229          "max_tokens": 131000
230        },
231        "pricing": {
232          "input_per_million_tokens": 0.08,
233          "output_per_million_tokens": 0.4
234        },
235        "capabilities": {
236          "function_calling": false,
237          "vision": false,
238          "reasoning": true,
239          "prompt_caching": false,
240          "response_schema": true
241        },
242        "last_updated_at": "2026-04-24"
243      },
244      "gpt-oss-20b": {
245        "mode": "chat",
246        "context_window": {
247          "max_input": 131000,
248          "max_output": 131000,
249          "max_tokens": 131000
250        },
251        "pricing": {
252          "input_per_million_tokens": 0.04,
253          "output_per_million_tokens": 0.15
254        },
255        "capabilities": {
256          "function_calling": false,
257          "vision": false,
258          "reasoning": true,
259          "prompt_caching": false,
260          "response_schema": true
261        },
262        "last_updated_at": "2026-04-24"
263      },
264      "llava-v1.6-mistral-7b-hf": {
265        "mode": "chat",
266        "context_window": {
267          "max_input": 32000,
268          "max_output": 32000,
269          "max_tokens": 32000
270        },
271        "pricing": {
272          "input_per_million_tokens": 0.29,
273          "output_per_million_tokens": 0.29
274        },
275        "capabilities": {
276          "function_calling": false,
277          "vision": true,
278          "reasoning": false,
279          "prompt_caching": false,
280          "response_schema": true
281        },
282        "last_updated_at": "2026-04-24"
283      },
284      "mamba-codestral-7B-v0.1": {
285        "mode": "chat",
286        "context_window": {
287          "max_input": 256000,
288          "max_output": 256000,
289          "max_tokens": 256000
290        },
291        "pricing": {
292          "input_per_million_tokens": 0.19,
293          "output_per_million_tokens": 0.19
294        },
295        "capabilities": {
296          "function_calling": false,
297          "vision": false,
298          "reasoning": false,
299          "prompt_caching": false,
300          "response_schema": true
301        },
302        "last_updated_at": "2026-04-24"
303      }
304    }
305  }