/ mlflow / utils / model_catalog / azure_ai.json
azure_ai.json
   1  {
   2    "schema_version": "1.0",
   3    "models": {
   4      "Cohere-embed-v3-english": {
   5        "mode": "embedding",
   6        "context_window": {
   7          "max_input": 512,
   8          "max_tokens": 512
   9        },
  10        "pricing": {
  11          "input_per_million_tokens": 0.1,
  12          "output_per_million_tokens": 0.0
  13        },
  14        "capabilities": {
  15          "function_calling": false,
  16          "vision": false,
  17          "reasoning": false,
  18          "prompt_caching": false,
  19          "response_schema": false
  20        },
  21        "last_updated_at": "2026-04-24"
  22      },
  23      "Cohere-embed-v3-multilingual": {
  24        "mode": "embedding",
  25        "context_window": {
  26          "max_input": 512,
  27          "max_tokens": 512
  28        },
  29        "pricing": {
  30          "input_per_million_tokens": 0.1,
  31          "output_per_million_tokens": 0.0
  32        },
  33        "capabilities": {
  34          "function_calling": false,
  35          "vision": false,
  36          "reasoning": false,
  37          "prompt_caching": false,
  38          "response_schema": false
  39        },
  40        "last_updated_at": "2026-04-24"
  41      },
  42      "Llama-3.2-11B-Vision-Instruct": {
  43        "mode": "chat",
  44        "context_window": {
  45          "max_input": 128000,
  46          "max_output": 2048,
  47          "max_tokens": 2048
  48        },
  49        "pricing": {
  50          "input_per_million_tokens": 0.37,
  51          "output_per_million_tokens": 0.37
  52        },
  53        "capabilities": {
  54          "function_calling": true,
  55          "vision": true,
  56          "reasoning": false,
  57          "prompt_caching": false,
  58          "response_schema": false
  59        },
  60        "last_updated_at": "2026-04-24"
  61      },
  62      "Llama-3.2-90B-Vision-Instruct": {
  63        "mode": "chat",
  64        "context_window": {
  65          "max_input": 128000,
  66          "max_output": 2048,
  67          "max_tokens": 2048
  68        },
  69        "pricing": {
  70          "input_per_million_tokens": 2.04,
  71          "output_per_million_tokens": 2.04
  72        },
  73        "capabilities": {
  74          "function_calling": true,
  75          "vision": true,
  76          "reasoning": false,
  77          "prompt_caching": false,
  78          "response_schema": false
  79        },
  80        "last_updated_at": "2026-04-24"
  81      },
  82      "Llama-3.3-70B-Instruct": {
  83        "mode": "chat",
  84        "context_window": {
  85          "max_input": 128000,
  86          "max_output": 2048,
  87          "max_tokens": 2048
  88        },
  89        "pricing": {
  90          "input_per_million_tokens": 0.71,
  91          "output_per_million_tokens": 0.71
  92        },
  93        "capabilities": {
  94          "function_calling": true,
  95          "vision": false,
  96          "reasoning": false,
  97          "prompt_caching": false,
  98          "response_schema": false
  99        },
 100        "last_updated_at": "2026-04-24"
 101      },
 102      "Llama-4-Maverick-17B-128E-Instruct-FP8": {
 103        "mode": "chat",
 104        "context_window": {
 105          "max_input": 1000000,
 106          "max_output": 16384,
 107          "max_tokens": 16384
 108        },
 109        "pricing": {
 110          "input_per_million_tokens": 0.35,
 111          "output_per_million_tokens": 1.41
 112        },
 113        "capabilities": {
 114          "function_calling": true,
 115          "vision": true,
 116          "reasoning": false,
 117          "prompt_caching": false,
 118          "response_schema": false
 119        },
 120        "last_updated_at": "2026-04-24"
 121      },
 122      "Llama-4-Scout-17B-16E-Instruct": {
 123        "mode": "chat",
 124        "context_window": {
 125          "max_input": 10000000,
 126          "max_output": 16384,
 127          "max_tokens": 16384
 128        },
 129        "pricing": {
 130          "input_per_million_tokens": 0.2,
 131          "output_per_million_tokens": 0.78
 132        },
 133        "capabilities": {
 134          "function_calling": true,
 135          "vision": true,
 136          "reasoning": false,
 137          "prompt_caching": false,
 138          "response_schema": false
 139        },
 140        "last_updated_at": "2026-04-24"
 141      },
 142      "MAI-DS-R1": {
 143        "mode": "chat",
 144        "context_window": {
 145          "max_input": 128000,
 146          "max_output": 8192,
 147          "max_tokens": 8192
 148        },
 149        "pricing": {
 150          "input_per_million_tokens": 1.35,
 151          "output_per_million_tokens": 5.4
 152        },
 153        "capabilities": {
 154          "function_calling": false,
 155          "vision": false,
 156          "reasoning": true,
 157          "prompt_caching": false,
 158          "response_schema": false
 159        },
 160        "last_updated_at": "2026-04-24"
 161      },
 162      "Meta-Llama-3-70B-Instruct": {
 163        "mode": "chat",
 164        "context_window": {
 165          "max_input": 8192,
 166          "max_output": 2048,
 167          "max_tokens": 2048
 168        },
 169        "pricing": {
 170          "input_per_million_tokens": 1.1,
 171          "output_per_million_tokens": 0.37
 172        },
 173        "capabilities": {
 174          "function_calling": false,
 175          "vision": false,
 176          "reasoning": false,
 177          "prompt_caching": false,
 178          "response_schema": false
 179        },
 180        "last_updated_at": "2026-04-24"
 181      },
 182      "Meta-Llama-3.1-405B-Instruct": {
 183        "mode": "chat",
 184        "context_window": {
 185          "max_input": 128000,
 186          "max_output": 2048,
 187          "max_tokens": 2048
 188        },
 189        "pricing": {
 190          "input_per_million_tokens": 5.33,
 191          "output_per_million_tokens": 16.0
 192        },
 193        "capabilities": {
 194          "function_calling": false,
 195          "vision": false,
 196          "reasoning": false,
 197          "prompt_caching": false,
 198          "response_schema": false
 199        },
 200        "last_updated_at": "2026-04-24"
 201      },
 202      "Meta-Llama-3.1-70B-Instruct": {
 203        "mode": "chat",
 204        "context_window": {
 205          "max_input": 128000,
 206          "max_output": 2048,
 207          "max_tokens": 2048
 208        },
 209        "pricing": {
 210          "input_per_million_tokens": 2.68,
 211          "output_per_million_tokens": 3.54
 212        },
 213        "capabilities": {
 214          "function_calling": false,
 215          "vision": false,
 216          "reasoning": false,
 217          "prompt_caching": false,
 218          "response_schema": false
 219        },
 220        "last_updated_at": "2026-04-24"
 221      },
 222      "Meta-Llama-3.1-8B-Instruct": {
 223        "mode": "chat",
 224        "context_window": {
 225          "max_input": 128000,
 226          "max_output": 2048,
 227          "max_tokens": 2048
 228        },
 229        "pricing": {
 230          "input_per_million_tokens": 0.3,
 231          "output_per_million_tokens": 0.61
 232        },
 233        "capabilities": {
 234          "function_calling": false,
 235          "vision": false,
 236          "reasoning": false,
 237          "prompt_caching": false,
 238          "response_schema": false
 239        },
 240        "last_updated_at": "2026-04-24"
 241      },
 242      "Phi-3-medium-128k-instruct": {
 243        "mode": "chat",
 244        "context_window": {
 245          "max_input": 128000,
 246          "max_output": 4096,
 247          "max_tokens": 4096
 248        },
 249        "pricing": {
 250          "input_per_million_tokens": 0.17,
 251          "output_per_million_tokens": 0.68
 252        },
 253        "capabilities": {
 254          "function_calling": false,
 255          "vision": false,
 256          "reasoning": false,
 257          "prompt_caching": false,
 258          "response_schema": false
 259        },
 260        "last_updated_at": "2026-04-24"
 261      },
 262      "Phi-3-medium-4k-instruct": {
 263        "mode": "chat",
 264        "context_window": {
 265          "max_input": 4096,
 266          "max_output": 4096,
 267          "max_tokens": 4096
 268        },
 269        "pricing": {
 270          "input_per_million_tokens": 0.17,
 271          "output_per_million_tokens": 0.68
 272        },
 273        "capabilities": {
 274          "function_calling": false,
 275          "vision": false,
 276          "reasoning": false,
 277          "prompt_caching": false,
 278          "response_schema": false
 279        },
 280        "last_updated_at": "2026-04-24"
 281      },
 282      "Phi-3-mini-128k-instruct": {
 283        "mode": "chat",
 284        "context_window": {
 285          "max_input": 128000,
 286          "max_output": 4096,
 287          "max_tokens": 4096
 288        },
 289        "pricing": {
 290          "input_per_million_tokens": 0.13,
 291          "output_per_million_tokens": 0.52
 292        },
 293        "capabilities": {
 294          "function_calling": false,
 295          "vision": false,
 296          "reasoning": false,
 297          "prompt_caching": false,
 298          "response_schema": false
 299        },
 300        "last_updated_at": "2026-04-24"
 301      },
 302      "Phi-3-mini-4k-instruct": {
 303        "mode": "chat",
 304        "context_window": {
 305          "max_input": 4096,
 306          "max_output": 4096,
 307          "max_tokens": 4096
 308        },
 309        "pricing": {
 310          "input_per_million_tokens": 0.13,
 311          "output_per_million_tokens": 0.52
 312        },
 313        "capabilities": {
 314          "function_calling": false,
 315          "vision": false,
 316          "reasoning": false,
 317          "prompt_caching": false,
 318          "response_schema": false
 319        },
 320        "last_updated_at": "2026-04-24"
 321      },
 322      "Phi-3-small-128k-instruct": {
 323        "mode": "chat",
 324        "context_window": {
 325          "max_input": 128000,
 326          "max_output": 4096,
 327          "max_tokens": 4096
 328        },
 329        "pricing": {
 330          "input_per_million_tokens": 0.15,
 331          "output_per_million_tokens": 0.6
 332        },
 333        "capabilities": {
 334          "function_calling": false,
 335          "vision": false,
 336          "reasoning": false,
 337          "prompt_caching": false,
 338          "response_schema": false
 339        },
 340        "last_updated_at": "2026-04-24"
 341      },
 342      "Phi-3-small-8k-instruct": {
 343        "mode": "chat",
 344        "context_window": {
 345          "max_input": 8192,
 346          "max_output": 4096,
 347          "max_tokens": 4096
 348        },
 349        "pricing": {
 350          "input_per_million_tokens": 0.15,
 351          "output_per_million_tokens": 0.6
 352        },
 353        "capabilities": {
 354          "function_calling": false,
 355          "vision": false,
 356          "reasoning": false,
 357          "prompt_caching": false,
 358          "response_schema": false
 359        },
 360        "last_updated_at": "2026-04-24"
 361      },
 362      "Phi-3.5-MoE-instruct": {
 363        "mode": "chat",
 364        "context_window": {
 365          "max_input": 128000,
 366          "max_output": 4096,
 367          "max_tokens": 4096
 368        },
 369        "pricing": {
 370          "input_per_million_tokens": 0.16,
 371          "output_per_million_tokens": 0.64
 372        },
 373        "capabilities": {
 374          "function_calling": false,
 375          "vision": false,
 376          "reasoning": false,
 377          "prompt_caching": false,
 378          "response_schema": false
 379        },
 380        "last_updated_at": "2026-04-24"
 381      },
 382      "Phi-3.5-mini-instruct": {
 383        "mode": "chat",
 384        "context_window": {
 385          "max_input": 128000,
 386          "max_output": 4096,
 387          "max_tokens": 4096
 388        },
 389        "pricing": {
 390          "input_per_million_tokens": 0.13,
 391          "output_per_million_tokens": 0.52
 392        },
 393        "capabilities": {
 394          "function_calling": false,
 395          "vision": false,
 396          "reasoning": false,
 397          "prompt_caching": false,
 398          "response_schema": false
 399        },
 400        "last_updated_at": "2026-04-24"
 401      },
 402      "Phi-3.5-vision-instruct": {
 403        "mode": "chat",
 404        "context_window": {
 405          "max_input": 128000,
 406          "max_output": 4096,
 407          "max_tokens": 4096
 408        },
 409        "pricing": {
 410          "input_per_million_tokens": 0.13,
 411          "output_per_million_tokens": 0.52
 412        },
 413        "capabilities": {
 414          "function_calling": false,
 415          "vision": true,
 416          "reasoning": false,
 417          "prompt_caching": false,
 418          "response_schema": false
 419        },
 420        "last_updated_at": "2026-04-24"
 421      },
 422      "Phi-4": {
 423        "mode": "chat",
 424        "context_window": {
 425          "max_input": 16384,
 426          "max_output": 16384,
 427          "max_tokens": 16384
 428        },
 429        "pricing": {
 430          "input_per_million_tokens": 0.125,
 431          "output_per_million_tokens": 0.5
 432        },
 433        "capabilities": {
 434          "function_calling": true,
 435          "vision": false,
 436          "reasoning": false,
 437          "prompt_caching": false,
 438          "response_schema": false
 439        },
 440        "last_updated_at": "2026-04-24"
 441      },
 442      "Phi-4-mini-instruct": {
 443        "mode": "chat",
 444        "context_window": {
 445          "max_input": 131072,
 446          "max_output": 4096,
 447          "max_tokens": 4096
 448        },
 449        "pricing": {
 450          "input_per_million_tokens": 0.075,
 451          "output_per_million_tokens": 0.3
 452        },
 453        "capabilities": {
 454          "function_calling": true,
 455          "vision": false,
 456          "reasoning": false,
 457          "prompt_caching": false,
 458          "response_schema": false
 459        },
 460        "last_updated_at": "2026-04-24"
 461      },
 462      "Phi-4-mini-reasoning": {
 463        "mode": "chat",
 464        "context_window": {
 465          "max_input": 131072,
 466          "max_output": 4096,
 467          "max_tokens": 4096
 468        },
 469        "pricing": {
 470          "input_per_million_tokens": 0.08,
 471          "output_per_million_tokens": 0.32
 472        },
 473        "capabilities": {
 474          "function_calling": true,
 475          "vision": false,
 476          "reasoning": true,
 477          "prompt_caching": false,
 478          "response_schema": false
 479        },
 480        "last_updated_at": "2026-04-24"
 481      },
 482      "Phi-4-multimodal-instruct": {
 483        "mode": "chat",
 484        "context_window": {
 485          "max_input": 131072,
 486          "max_output": 4096,
 487          "max_tokens": 4096
 488        },
 489        "pricing": {
 490          "input_per_million_tokens": 0.08,
 491          "output_per_million_tokens": 0.32,
 492          "modality": {
 493            "audio": {
 494              "input_per_million_tokens": 4.0
 495            }
 496          }
 497        },
 498        "capabilities": {
 499          "function_calling": true,
 500          "vision": true,
 501          "reasoning": false,
 502          "prompt_caching": false,
 503          "response_schema": false
 504        },
 505        "last_updated_at": "2026-04-24"
 506      },
 507      "Phi-4-reasoning": {
 508        "mode": "chat",
 509        "context_window": {
 510          "max_input": 32768,
 511          "max_output": 4096,
 512          "max_tokens": 4096
 513        },
 514        "pricing": {
 515          "input_per_million_tokens": 0.125,
 516          "output_per_million_tokens": 0.5
 517        },
 518        "capabilities": {
 519          "function_calling": true,
 520          "vision": false,
 521          "reasoning": true,
 522          "prompt_caching": false,
 523          "response_schema": false
 524        },
 525        "last_updated_at": "2026-04-24"
 526      },
 527      "claude-haiku-4-5": {
 528        "mode": "chat",
 529        "context_window": {
 530          "max_input": 200000,
 531          "max_output": 64000,
 532          "max_tokens": 64000
 533        },
 534        "pricing": {
 535          "input_per_million_tokens": 1.0,
 536          "output_per_million_tokens": 5.0,
 537          "cache_read_per_million_tokens": 0.1,
 538          "cache_write_per_million_tokens": 1.25
 539        },
 540        "capabilities": {
 541          "function_calling": true,
 542          "vision": true,
 543          "reasoning": true,
 544          "prompt_caching": true,
 545          "response_schema": true
 546        },
 547        "last_updated_at": "2026-04-24"
 548      },
 549      "claude-opus-4-1": {
 550        "mode": "chat",
 551        "context_window": {
 552          "max_input": 200000,
 553          "max_output": 32000,
 554          "max_tokens": 32000
 555        },
 556        "pricing": {
 557          "input_per_million_tokens": 15.0,
 558          "output_per_million_tokens": 75.0,
 559          "cache_read_per_million_tokens": 1.5,
 560          "cache_write_per_million_tokens": 18.75
 561        },
 562        "capabilities": {
 563          "function_calling": true,
 564          "vision": true,
 565          "reasoning": true,
 566          "prompt_caching": true,
 567          "response_schema": true
 568        },
 569        "last_updated_at": "2026-04-24"
 570      },
 571      "claude-opus-4-5": {
 572        "mode": "chat",
 573        "context_window": {
 574          "max_input": 200000,
 575          "max_output": 64000,
 576          "max_tokens": 64000
 577        },
 578        "pricing": {
 579          "input_per_million_tokens": 5.0,
 580          "output_per_million_tokens": 25.0,
 581          "cache_read_per_million_tokens": 0.5,
 582          "cache_write_per_million_tokens": 6.25
 583        },
 584        "capabilities": {
 585          "function_calling": true,
 586          "vision": true,
 587          "reasoning": true,
 588          "prompt_caching": true,
 589          "response_schema": true
 590        },
 591        "last_updated_at": "2026-04-24"
 592      },
 593      "claude-opus-4-6": {
 594        "mode": "chat",
 595        "context_window": {
 596          "max_input": 200000,
 597          "max_output": 128000,
 598          "max_tokens": 128000
 599        },
 600        "pricing": {
 601          "input_per_million_tokens": 5.0,
 602          "output_per_million_tokens": 25.0,
 603          "cache_read_per_million_tokens": 0.5,
 604          "cache_write_per_million_tokens": 6.25,
 605          "tooling": {
 606            "search_context_per_query": {
 607              "search_context_size_high": 0.01,
 608              "search_context_size_low": 0.01,
 609              "search_context_size_medium": 0.01
 610            },
 611            "tool_use_system_prompt_tokens": 159
 612          }
 613        },
 614        "capabilities": {
 615          "function_calling": true,
 616          "vision": true,
 617          "reasoning": true,
 618          "prompt_caching": true,
 619          "response_schema": true
 620        },
 621        "last_updated_at": "2026-04-24"
 622      },
 623      "claude-opus-4-7": {
 624        "mode": "chat",
 625        "context_window": {
 626          "max_input": 200000,
 627          "max_output": 128000,
 628          "max_tokens": 128000
 629        },
 630        "pricing": {
 631          "input_per_million_tokens": 5.0,
 632          "output_per_million_tokens": 25.0,
 633          "cache_read_per_million_tokens": 0.5,
 634          "cache_write_per_million_tokens": 6.25,
 635          "tooling": {
 636            "search_context_per_query": {
 637              "search_context_size_high": 0.01,
 638              "search_context_size_low": 0.01,
 639              "search_context_size_medium": 0.01
 640            },
 641            "tool_use_system_prompt_tokens": 159
 642          }
 643        },
 644        "capabilities": {
 645          "function_calling": true,
 646          "vision": true,
 647          "reasoning": true,
 648          "prompt_caching": true,
 649          "response_schema": true
 650        },
 651        "last_updated_at": "2026-04-24"
 652      },
 653      "claude-sonnet-4-5": {
 654        "mode": "chat",
 655        "context_window": {
 656          "max_input": 200000,
 657          "max_output": 64000,
 658          "max_tokens": 64000
 659        },
 660        "pricing": {
 661          "input_per_million_tokens": 3.0,
 662          "output_per_million_tokens": 15.0,
 663          "cache_read_per_million_tokens": 0.3,
 664          "cache_write_per_million_tokens": 3.75
 665        },
 666        "capabilities": {
 667          "function_calling": true,
 668          "vision": true,
 669          "reasoning": true,
 670          "prompt_caching": true,
 671          "response_schema": true
 672        },
 673        "last_updated_at": "2026-04-24"
 674      },
 675      "claude-sonnet-4-6": {
 676        "mode": "chat",
 677        "context_window": {
 678          "max_input": 1000000,
 679          "max_output": 64000,
 680          "max_tokens": 64000
 681        },
 682        "pricing": {
 683          "input_per_million_tokens": 3.0,
 684          "output_per_million_tokens": 15.0,
 685          "cache_read_per_million_tokens": 0.3,
 686          "cache_write_per_million_tokens": 3.75,
 687          "tooling": {
 688            "tool_use_system_prompt_tokens": 346
 689          }
 690        },
 691        "capabilities": {
 692          "function_calling": true,
 693          "vision": true,
 694          "reasoning": true,
 695          "prompt_caching": true,
 696          "response_schema": true
 697        },
 698        "last_updated_at": "2026-04-24"
 699      },
 700      "deepseek-r1": {
 701        "mode": "chat",
 702        "context_window": {
 703          "max_input": 128000,
 704          "max_output": 8192,
 705          "max_tokens": 8192
 706        },
 707        "pricing": {
 708          "input_per_million_tokens": 1.35,
 709          "output_per_million_tokens": 5.4
 710        },
 711        "capabilities": {
 712          "function_calling": false,
 713          "vision": false,
 714          "reasoning": true,
 715          "prompt_caching": false,
 716          "response_schema": false
 717        },
 718        "last_updated_at": "2026-04-24"
 719      },
 720      "deepseek-v3": {
 721        "mode": "chat",
 722        "context_window": {
 723          "max_input": 128000,
 724          "max_output": 8192,
 725          "max_tokens": 8192
 726        },
 727        "pricing": {
 728          "input_per_million_tokens": 1.14,
 729          "output_per_million_tokens": 4.56
 730        },
 731        "capabilities": {
 732          "function_calling": false,
 733          "vision": false,
 734          "reasoning": false,
 735          "prompt_caching": false,
 736          "response_schema": false
 737        },
 738        "last_updated_at": "2026-04-24"
 739      },
 740      "deepseek-v3-0324": {
 741        "mode": "chat",
 742        "context_window": {
 743          "max_input": 128000,
 744          "max_output": 8192,
 745          "max_tokens": 8192
 746        },
 747        "pricing": {
 748          "input_per_million_tokens": 1.14,
 749          "output_per_million_tokens": 4.56
 750        },
 751        "capabilities": {
 752          "function_calling": true,
 753          "vision": false,
 754          "reasoning": false,
 755          "prompt_caching": false,
 756          "response_schema": false
 757        },
 758        "last_updated_at": "2026-04-24"
 759      },
 760      "deepseek-v3.2": {
 761        "mode": "chat",
 762        "context_window": {
 763          "max_input": 163840,
 764          "max_output": 163840,
 765          "max_tokens": 163840
 766        },
 767        "pricing": {
 768          "input_per_million_tokens": 0.58,
 769          "output_per_million_tokens": 1.68
 770        },
 771        "capabilities": {
 772          "function_calling": true,
 773          "vision": false,
 774          "reasoning": true,
 775          "prompt_caching": true,
 776          "response_schema": false
 777        },
 778        "last_updated_at": "2026-04-24"
 779      },
 780      "deepseek-v3.2-speciale": {
 781        "mode": "chat",
 782        "context_window": {
 783          "max_input": 163840,
 784          "max_output": 163840,
 785          "max_tokens": 163840
 786        },
 787        "pricing": {
 788          "input_per_million_tokens": 0.58,
 789          "output_per_million_tokens": 1.68
 790        },
 791        "capabilities": {
 792          "function_calling": true,
 793          "vision": false,
 794          "reasoning": true,
 795          "prompt_caching": true,
 796          "response_schema": false
 797        },
 798        "last_updated_at": "2026-04-24"
 799      },
 800      "embed-v-4-0": {
 801        "mode": "embedding",
 802        "context_window": {
 803          "max_input": 128000,
 804          "max_tokens": 128000
 805        },
 806        "pricing": {
 807          "input_per_million_tokens": 0.12,
 808          "output_per_million_tokens": 0.0
 809        },
 810        "capabilities": {
 811          "function_calling": false,
 812          "vision": false,
 813          "reasoning": false,
 814          "prompt_caching": false,
 815          "response_schema": false
 816        },
 817        "last_updated_at": "2026-04-24"
 818      },
 819      "global/grok-3": {
 820        "mode": "chat",
 821        "context_window": {
 822          "max_input": 131072,
 823          "max_output": 131072,
 824          "max_tokens": 131072
 825        },
 826        "pricing": {
 827          "input_per_million_tokens": 3.0,
 828          "output_per_million_tokens": 15.0
 829        },
 830        "capabilities": {
 831          "function_calling": true,
 832          "vision": false,
 833          "reasoning": false,
 834          "prompt_caching": false,
 835          "response_schema": false
 836        },
 837        "last_updated_at": "2026-04-24"
 838      },
 839      "global/grok-3-mini": {
 840        "mode": "chat",
 841        "context_window": {
 842          "max_input": 131072,
 843          "max_output": 131072,
 844          "max_tokens": 131072
 845        },
 846        "pricing": {
 847          "input_per_million_tokens": 0.25,
 848          "output_per_million_tokens": 1.27
 849        },
 850        "capabilities": {
 851          "function_calling": true,
 852          "vision": false,
 853          "reasoning": true,
 854          "prompt_caching": false,
 855          "response_schema": false
 856        },
 857        "last_updated_at": "2026-04-24"
 858      },
 859      "gpt-oss-120b": {
 860        "mode": "chat",
 861        "context_window": {
 862          "max_input": 131072,
 863          "max_output": 131072,
 864          "max_tokens": 131072
 865        },
 866        "pricing": {
 867          "input_per_million_tokens": 0.15,
 868          "output_per_million_tokens": 0.6
 869        },
 870        "capabilities": {
 871          "function_calling": true,
 872          "vision": false,
 873          "reasoning": false,
 874          "prompt_caching": false,
 875          "response_schema": true
 876        },
 877        "last_updated_at": "2026-04-24"
 878      },
 879      "grok-3": {
 880        "mode": "chat",
 881        "context_window": {
 882          "max_input": 131072,
 883          "max_output": 131072,
 884          "max_tokens": 131072
 885        },
 886        "pricing": {
 887          "input_per_million_tokens": 3.0,
 888          "output_per_million_tokens": 15.0
 889        },
 890        "capabilities": {
 891          "function_calling": true,
 892          "vision": false,
 893          "reasoning": false,
 894          "prompt_caching": false,
 895          "response_schema": false
 896        },
 897        "last_updated_at": "2026-04-24"
 898      },
 899      "grok-3-mini": {
 900        "mode": "chat",
 901        "context_window": {
 902          "max_input": 131072,
 903          "max_output": 131072,
 904          "max_tokens": 131072
 905        },
 906        "pricing": {
 907          "input_per_million_tokens": 0.25,
 908          "output_per_million_tokens": 1.27
 909        },
 910        "capabilities": {
 911          "function_calling": true,
 912          "vision": false,
 913          "reasoning": true,
 914          "prompt_caching": false,
 915          "response_schema": false
 916        },
 917        "last_updated_at": "2026-04-24"
 918      },
 919      "grok-4": {
 920        "mode": "chat",
 921        "context_window": {
 922          "max_input": 131072,
 923          "max_output": 131072,
 924          "max_tokens": 131072
 925        },
 926        "pricing": {
 927          "input_per_million_tokens": 3.0,
 928          "output_per_million_tokens": 15.0
 929        },
 930        "capabilities": {
 931          "function_calling": true,
 932          "vision": false,
 933          "reasoning": false,
 934          "prompt_caching": false,
 935          "response_schema": true
 936        },
 937        "last_updated_at": "2026-04-24"
 938      },
 939      "grok-4-1-fast-non-reasoning": {
 940        "mode": "chat",
 941        "context_window": {
 942          "max_input": 131072,
 943          "max_output": 131072,
 944          "max_tokens": 131072
 945        },
 946        "pricing": {
 947          "input_per_million_tokens": 0.2,
 948          "output_per_million_tokens": 0.5
 949        },
 950        "capabilities": {
 951          "function_calling": true,
 952          "vision": false,
 953          "reasoning": false,
 954          "prompt_caching": false,
 955          "response_schema": true
 956        },
 957        "last_updated_at": "2026-04-24"
 958      },
 959      "grok-4-1-fast-reasoning": {
 960        "mode": "chat",
 961        "context_window": {
 962          "max_input": 131072,
 963          "max_output": 131072,
 964          "max_tokens": 131072
 965        },
 966        "pricing": {
 967          "input_per_million_tokens": 0.2,
 968          "output_per_million_tokens": 0.5
 969        },
 970        "capabilities": {
 971          "function_calling": true,
 972          "vision": false,
 973          "reasoning": true,
 974          "prompt_caching": false,
 975          "response_schema": true
 976        },
 977        "last_updated_at": "2026-04-24"
 978      },
 979      "grok-4-fast-non-reasoning": {
 980        "mode": "chat",
 981        "context_window": {
 982          "max_input": 131072,
 983          "max_output": 131072,
 984          "max_tokens": 131072
 985        },
 986        "pricing": {
 987          "input_per_million_tokens": 0.2,
 988          "output_per_million_tokens": 0.5
 989        },
 990        "capabilities": {
 991          "function_calling": true,
 992          "vision": false,
 993          "reasoning": false,
 994          "prompt_caching": false,
 995          "response_schema": true
 996        },
 997        "last_updated_at": "2026-04-24"
 998      },
 999      "grok-4-fast-reasoning": {
1000        "mode": "chat",
1001        "context_window": {
1002          "max_input": 131072,
1003          "max_output": 131072,
1004          "max_tokens": 131072
1005        },
1006        "pricing": {
1007          "input_per_million_tokens": 0.2,
1008          "output_per_million_tokens": 0.5
1009        },
1010        "capabilities": {
1011          "function_calling": true,
1012          "vision": false,
1013          "reasoning": false,
1014          "prompt_caching": false,
1015          "response_schema": true
1016        },
1017        "last_updated_at": "2026-04-24"
1018      },
1019      "grok-code-fast-1": {
1020        "mode": "chat",
1021        "context_window": {
1022          "max_input": 131072,
1023          "max_output": 131072,
1024          "max_tokens": 131072
1025        },
1026        "pricing": {
1027          "input_per_million_tokens": 0.2,
1028          "output_per_million_tokens": 1.5
1029        },
1030        "capabilities": {
1031          "function_calling": true,
1032          "vision": false,
1033          "reasoning": false,
1034          "prompt_caching": false,
1035          "response_schema": true
1036        },
1037        "last_updated_at": "2026-04-24"
1038      },
1039      "jais-30b-chat": {
1040        "mode": "chat",
1041        "context_window": {
1042          "max_input": 8192,
1043          "max_output": 8192,
1044          "max_tokens": 8192
1045        },
1046        "pricing": {
1047          "input_per_million_tokens": 3200.0,
1048          "output_per_million_tokens": 9710.0
1049        },
1050        "capabilities": {
1051          "function_calling": false,
1052          "vision": false,
1053          "reasoning": false,
1054          "prompt_caching": false,
1055          "response_schema": false
1056        },
1057        "last_updated_at": "2026-04-24"
1058      },
1059      "jamba-instruct": {
1060        "mode": "chat",
1061        "context_window": {
1062          "max_input": 70000,
1063          "max_output": 4096,
1064          "max_tokens": 4096
1065        },
1066        "pricing": {
1067          "input_per_million_tokens": 0.5,
1068          "output_per_million_tokens": 0.7
1069        },
1070        "capabilities": {
1071          "function_calling": false,
1072          "vision": false,
1073          "reasoning": false,
1074          "prompt_caching": false,
1075          "response_schema": false
1076        },
1077        "last_updated_at": "2026-04-24"
1078      },
1079      "kimi-k2.5": {
1080        "mode": "chat",
1081        "context_window": {
1082          "max_input": 262144,
1083          "max_output": 262144,
1084          "max_tokens": 262144
1085        },
1086        "pricing": {
1087          "input_per_million_tokens": 0.6,
1088          "output_per_million_tokens": 3.0
1089        },
1090        "capabilities": {
1091          "function_calling": true,
1092          "vision": true,
1093          "reasoning": false,
1094          "prompt_caching": false,
1095          "response_schema": false
1096        },
1097        "last_updated_at": "2026-04-24"
1098      },
1099      "ministral-3b": {
1100        "mode": "chat",
1101        "context_window": {
1102          "max_input": 128000,
1103          "max_output": 4096,
1104          "max_tokens": 4096
1105        },
1106        "pricing": {
1107          "input_per_million_tokens": 0.04,
1108          "output_per_million_tokens": 0.04
1109        },
1110        "capabilities": {
1111          "function_calling": true,
1112          "vision": false,
1113          "reasoning": false,
1114          "prompt_caching": false,
1115          "response_schema": false
1116        },
1117        "last_updated_at": "2026-04-24"
1118      },
1119      "mistral-large": {
1120        "mode": "chat",
1121        "context_window": {
1122          "max_input": 32000,
1123          "max_output": 8191,
1124          "max_tokens": 8191
1125        },
1126        "pricing": {
1127          "input_per_million_tokens": 4.0,
1128          "output_per_million_tokens": 12.0
1129        },
1130        "capabilities": {
1131          "function_calling": true,
1132          "vision": false,
1133          "reasoning": false,
1134          "prompt_caching": false,
1135          "response_schema": false
1136        },
1137        "last_updated_at": "2026-04-24"
1138      },
1139      "mistral-large-2407": {
1140        "mode": "chat",
1141        "context_window": {
1142          "max_input": 128000,
1143          "max_output": 4096,
1144          "max_tokens": 4096
1145        },
1146        "pricing": {
1147          "input_per_million_tokens": 2.0,
1148          "output_per_million_tokens": 6.0
1149        },
1150        "capabilities": {
1151          "function_calling": true,
1152          "vision": false,
1153          "reasoning": false,
1154          "prompt_caching": false,
1155          "response_schema": false
1156        },
1157        "last_updated_at": "2026-04-24"
1158      },
1159      "mistral-large-3": {
1160        "mode": "chat",
1161        "context_window": {
1162          "max_input": 256000,
1163          "max_output": 8191,
1164          "max_tokens": 8191
1165        },
1166        "pricing": {
1167          "input_per_million_tokens": 0.5,
1168          "output_per_million_tokens": 1.5
1169        },
1170        "capabilities": {
1171          "function_calling": true,
1172          "vision": true,
1173          "reasoning": false,
1174          "prompt_caching": false,
1175          "response_schema": false
1176        },
1177        "last_updated_at": "2026-04-24"
1178      },
1179      "mistral-large-latest": {
1180        "mode": "chat",
1181        "context_window": {
1182          "max_input": 128000,
1183          "max_output": 4096,
1184          "max_tokens": 4096
1185        },
1186        "pricing": {
1187          "input_per_million_tokens": 2.0,
1188          "output_per_million_tokens": 6.0
1189        },
1190        "capabilities": {
1191          "function_calling": true,
1192          "vision": false,
1193          "reasoning": false,
1194          "prompt_caching": false,
1195          "response_schema": false
1196        },
1197        "last_updated_at": "2026-04-24"
1198      },
1199      "mistral-medium-2505": {
1200        "mode": "chat",
1201        "context_window": {
1202          "max_input": 131072,
1203          "max_output": 8191,
1204          "max_tokens": 8191
1205        },
1206        "pricing": {
1207          "input_per_million_tokens": 0.4,
1208          "output_per_million_tokens": 2.0
1209        },
1210        "capabilities": {
1211          "function_calling": true,
1212          "vision": false,
1213          "reasoning": false,
1214          "prompt_caching": false,
1215          "response_schema": false
1216        },
1217        "last_updated_at": "2026-04-24"
1218      },
1219      "mistral-nemo": {
1220        "mode": "chat",
1221        "context_window": {
1222          "max_input": 131072,
1223          "max_output": 4096,
1224          "max_tokens": 4096
1225        },
1226        "pricing": {
1227          "input_per_million_tokens": 0.15,
1228          "output_per_million_tokens": 0.15
1229        },
1230        "capabilities": {
1231          "function_calling": true,
1232          "vision": false,
1233          "reasoning": false,
1234          "prompt_caching": false,
1235          "response_schema": false
1236        },
1237        "last_updated_at": "2026-04-24"
1238      },
1239      "mistral-small": {
1240        "mode": "chat",
1241        "context_window": {
1242          "max_input": 32000,
1243          "max_output": 8191,
1244          "max_tokens": 8191
1245        },
1246        "pricing": {
1247          "input_per_million_tokens": 1.0,
1248          "output_per_million_tokens": 3.0
1249        },
1250        "capabilities": {
1251          "function_calling": true,
1252          "vision": false,
1253          "reasoning": false,
1254          "prompt_caching": false,
1255          "response_schema": false
1256        },
1257        "last_updated_at": "2026-04-24"
1258      },
1259      "mistral-small-2503": {
1260        "mode": "chat",
1261        "context_window": {
1262          "max_input": 128000,
1263          "max_output": 128000,
1264          "max_tokens": 128000
1265        },
1266        "pricing": {
1267          "input_per_million_tokens": 0.1,
1268          "output_per_million_tokens": 0.3
1269        },
1270        "capabilities": {
1271          "function_calling": true,
1272          "vision": true,
1273          "reasoning": false,
1274          "prompt_caching": false,
1275          "response_schema": false
1276        },
1277        "last_updated_at": "2026-04-24"
1278      },
1279      "model_router": {
1280        "mode": "chat",
1281        "pricing": {
1282          "input_per_million_tokens": 0.14,
1283          "output_per_million_tokens": 0
1284        },
1285        "capabilities": {
1286          "function_calling": false,
1287          "vision": false,
1288          "reasoning": false,
1289          "prompt_caching": false,
1290          "response_schema": false
1291        },
1292        "last_updated_at": "2026-04-24"
1293      }
1294    }
1295  }