novita.json
1 { 2 "schema_version": "1.0", 3 "models": { 4 "Sao10K/L3-8B-Stheno-v3.2": { 5 "mode": "chat", 6 "context_window": { 7 "max_input": 8192, 8 "max_output": 32000, 9 "max_tokens": 32000 10 }, 11 "pricing": { 12 "input_per_million_tokens": 0.05, 13 "output_per_million_tokens": 0.05 14 }, 15 "capabilities": { 16 "function_calling": true, 17 "vision": false, 18 "reasoning": false, 19 "prompt_caching": false, 20 "response_schema": false 21 }, 22 "last_updated_at": "2026-04-24" 23 }, 24 "baai/bge-m3": { 25 "mode": "embedding", 26 "context_window": { 27 "max_input": 8192, 28 "max_output": 96000, 29 "max_tokens": 96000 30 }, 31 "pricing": { 32 "input_per_million_tokens": 0.01, 33 "output_per_million_tokens": 0.01 34 }, 35 "capabilities": { 36 "function_calling": false, 37 "vision": false, 38 "reasoning": false, 39 "prompt_caching": false, 40 "response_schema": false 41 }, 42 "last_updated_at": "2026-04-24" 43 }, 44 "baichuan/baichuan-m2-32b": { 45 "mode": "chat", 46 "context_window": { 47 "max_input": 131072, 48 "max_output": 131072, 49 "max_tokens": 131072 50 }, 51 "pricing": { 52 "input_per_million_tokens": 0.07, 53 "output_per_million_tokens": 0.07 54 }, 55 "capabilities": { 56 "function_calling": false, 57 "vision": false, 58 "reasoning": false, 59 "prompt_caching": false, 60 "response_schema": false 61 }, 62 "last_updated_at": "2026-04-24" 63 }, 64 "baidu/ernie-4.5-21B-a3b": { 65 "mode": "chat", 66 "context_window": { 67 "max_input": 120000, 68 "max_output": 8000, 69 "max_tokens": 8000 70 }, 71 "pricing": { 72 "input_per_million_tokens": 0.07, 73 "output_per_million_tokens": 0.28 74 }, 75 "capabilities": { 76 "function_calling": true, 77 "vision": false, 78 "reasoning": false, 79 "prompt_caching": false, 80 "response_schema": false 81 }, 82 "last_updated_at": "2026-04-24" 83 }, 84 "baidu/ernie-4.5-21B-a3b-thinking": { 85 "mode": "chat", 86 "context_window": { 87 "max_input": 131072, 88 "max_output": 65536, 89 "max_tokens": 65536 90 }, 91 "pricing": { 92 "input_per_million_tokens": 0.07, 93 "output_per_million_tokens": 0.28 94 }, 95 "capabilities": { 96 "function_calling": false, 97 "vision": false, 98 "reasoning": true, 99 "prompt_caching": false, 100 "response_schema": false 101 }, 102 "last_updated_at": "2026-04-24" 103 }, 104 "baidu/ernie-4.5-300b-a47b-paddle": { 105 "mode": "chat", 106 "context_window": { 107 "max_input": 123000, 108 "max_output": 12000, 109 "max_tokens": 12000 110 }, 111 "pricing": { 112 "input_per_million_tokens": 0.28, 113 "output_per_million_tokens": 1.1 114 }, 115 "capabilities": { 116 "function_calling": false, 117 "vision": false, 118 "reasoning": false, 119 "prompt_caching": false, 120 "response_schema": true 121 }, 122 "last_updated_at": "2026-04-24" 123 }, 124 "baidu/ernie-4.5-vl-28b-a3b": { 125 "mode": "chat", 126 "context_window": { 127 "max_input": 30000, 128 "max_output": 8000, 129 "max_tokens": 8000 130 }, 131 "pricing": { 132 "input_per_million_tokens": 0.14, 133 "output_per_million_tokens": 0.56 134 }, 135 "capabilities": { 136 "function_calling": true, 137 "vision": true, 138 "reasoning": true, 139 "prompt_caching": false, 140 "response_schema": false 141 }, 142 "last_updated_at": "2026-04-24" 143 }, 144 "baidu/ernie-4.5-vl-28b-a3b-thinking": { 145 "mode": "chat", 146 "context_window": { 147 "max_input": 131072, 148 "max_output": 65536, 149 "max_tokens": 65536 150 }, 151 "pricing": { 152 "input_per_million_tokens": 0.39, 153 "output_per_million_tokens": 0.39 154 }, 155 "capabilities": { 156 "function_calling": true, 157 "vision": true, 158 "reasoning": true, 159 "prompt_caching": false, 160 "response_schema": true 161 }, 162 "last_updated_at": "2026-04-24" 163 }, 164 "baidu/ernie-4.5-vl-424b-a47b": { 165 "mode": "chat", 166 "context_window": { 167 "max_input": 123000, 168 "max_output": 16000, 169 "max_tokens": 16000 170 }, 171 "pricing": { 172 "input_per_million_tokens": 0.42, 173 "output_per_million_tokens": 1.25 174 }, 175 "capabilities": { 176 "function_calling": false, 177 "vision": true, 178 "reasoning": true, 179 "prompt_caching": false, 180 "response_schema": false 181 }, 182 "last_updated_at": "2026-04-24" 183 }, 184 "deepseek/deepseek-ocr": { 185 "mode": "chat", 186 "context_window": { 187 "max_input": 8192, 188 "max_output": 8192, 189 "max_tokens": 8192 190 }, 191 "pricing": { 192 "input_per_million_tokens": 0.03, 193 "output_per_million_tokens": 0.03 194 }, 195 "capabilities": { 196 "function_calling": false, 197 "vision": true, 198 "reasoning": false, 199 "prompt_caching": false, 200 "response_schema": true 201 }, 202 "last_updated_at": "2026-04-24" 203 }, 204 "deepseek/deepseek-prover-v2-671b": { 205 "mode": "chat", 206 "context_window": { 207 "max_input": 160000, 208 "max_output": 160000, 209 "max_tokens": 160000 210 }, 211 "pricing": { 212 "input_per_million_tokens": 0.7, 213 "output_per_million_tokens": 2.5 214 }, 215 "capabilities": { 216 "function_calling": false, 217 "vision": false, 218 "reasoning": false, 219 "prompt_caching": false, 220 "response_schema": false 221 }, 222 "last_updated_at": "2026-04-24" 223 }, 224 "deepseek/deepseek-r1-0528": { 225 "mode": "chat", 226 "context_window": { 227 "max_input": 163840, 228 "max_output": 32768, 229 "max_tokens": 32768 230 }, 231 "pricing": { 232 "input_per_million_tokens": 0.7, 233 "output_per_million_tokens": 2.5, 234 "cache_read_per_million_tokens": 0.35 235 }, 236 "capabilities": { 237 "function_calling": true, 238 "vision": false, 239 "reasoning": true, 240 "prompt_caching": false, 241 "response_schema": true 242 }, 243 "last_updated_at": "2026-04-24" 244 }, 245 "deepseek/deepseek-r1-0528-qwen3-8b": { 246 "mode": "chat", 247 "context_window": { 248 "max_input": 128000, 249 "max_output": 32000, 250 "max_tokens": 32000 251 }, 252 "pricing": { 253 "input_per_million_tokens": 0.06, 254 "output_per_million_tokens": 0.09 255 }, 256 "capabilities": { 257 "function_calling": false, 258 "vision": false, 259 "reasoning": true, 260 "prompt_caching": false, 261 "response_schema": false 262 }, 263 "last_updated_at": "2026-04-24" 264 }, 265 "deepseek/deepseek-r1-distill-llama-70b": { 266 "mode": "chat", 267 "context_window": { 268 "max_input": 8192, 269 "max_output": 8192, 270 "max_tokens": 8192 271 }, 272 "pricing": { 273 "input_per_million_tokens": 0.8, 274 "output_per_million_tokens": 0.8 275 }, 276 "capabilities": { 277 "function_calling": false, 278 "vision": false, 279 "reasoning": true, 280 "prompt_caching": false, 281 "response_schema": true 282 }, 283 "last_updated_at": "2026-04-24" 284 }, 285 "deepseek/deepseek-r1-distill-qwen-14b": { 286 "mode": "chat", 287 "context_window": { 288 "max_input": 32768, 289 "max_output": 16384, 290 "max_tokens": 16384 291 }, 292 "pricing": { 293 "input_per_million_tokens": 0.15, 294 "output_per_million_tokens": 0.15 295 }, 296 "capabilities": { 297 "function_calling": false, 298 "vision": false, 299 "reasoning": true, 300 "prompt_caching": false, 301 "response_schema": true 302 }, 303 "last_updated_at": "2026-04-24" 304 }, 305 "deepseek/deepseek-r1-distill-qwen-32b": { 306 "mode": "chat", 307 "context_window": { 308 "max_input": 64000, 309 "max_output": 32000, 310 "max_tokens": 32000 311 }, 312 "pricing": { 313 "input_per_million_tokens": 0.3, 314 "output_per_million_tokens": 0.3 315 }, 316 "capabilities": { 317 "function_calling": false, 318 "vision": false, 319 "reasoning": true, 320 "prompt_caching": false, 321 "response_schema": true 322 }, 323 "last_updated_at": "2026-04-24" 324 }, 325 "deepseek/deepseek-r1-turbo": { 326 "mode": "chat", 327 "context_window": { 328 "max_input": 64000, 329 "max_output": 16000, 330 "max_tokens": 16000 331 }, 332 "pricing": { 333 "input_per_million_tokens": 0.7, 334 "output_per_million_tokens": 2.5 335 }, 336 "capabilities": { 337 "function_calling": true, 338 "vision": false, 339 "reasoning": true, 340 "prompt_caching": false, 341 "response_schema": false 342 }, 343 "last_updated_at": "2026-04-24" 344 }, 345 "deepseek/deepseek-v3-0324": { 346 "mode": "chat", 347 "context_window": { 348 "max_input": 163840, 349 "max_output": 163840, 350 "max_tokens": 163840 351 }, 352 "pricing": { 353 "input_per_million_tokens": 0.27, 354 "output_per_million_tokens": 1.12, 355 "cache_read_per_million_tokens": 0.135 356 }, 357 "capabilities": { 358 "function_calling": true, 359 "vision": false, 360 "reasoning": false, 361 "prompt_caching": false, 362 "response_schema": true 363 }, 364 "last_updated_at": "2026-04-24" 365 }, 366 "deepseek/deepseek-v3-turbo": { 367 "mode": "chat", 368 "context_window": { 369 "max_input": 64000, 370 "max_output": 16000, 371 "max_tokens": 16000 372 }, 373 "pricing": { 374 "input_per_million_tokens": 0.4, 375 "output_per_million_tokens": 1.3 376 }, 377 "capabilities": { 378 "function_calling": true, 379 "vision": false, 380 "reasoning": false, 381 "prompt_caching": false, 382 "response_schema": false 383 }, 384 "last_updated_at": "2026-04-24" 385 }, 386 "deepseek/deepseek-v3.1": { 387 "mode": "chat", 388 "context_window": { 389 "max_input": 131072, 390 "max_output": 32768, 391 "max_tokens": 32768 392 }, 393 "pricing": { 394 "input_per_million_tokens": 0.27, 395 "output_per_million_tokens": 1.0, 396 "cache_read_per_million_tokens": 0.135 397 }, 398 "capabilities": { 399 "function_calling": true, 400 "vision": false, 401 "reasoning": true, 402 "prompt_caching": false, 403 "response_schema": true 404 }, 405 "last_updated_at": "2026-04-24" 406 }, 407 "deepseek/deepseek-v3.1-terminus": { 408 "mode": "chat", 409 "context_window": { 410 "max_input": 131072, 411 "max_output": 32768, 412 "max_tokens": 32768 413 }, 414 "pricing": { 415 "input_per_million_tokens": 0.27, 416 "output_per_million_tokens": 1.0, 417 "cache_read_per_million_tokens": 0.135 418 }, 419 "capabilities": { 420 "function_calling": true, 421 "vision": false, 422 "reasoning": true, 423 "prompt_caching": false, 424 "response_schema": true 425 }, 426 "last_updated_at": "2026-04-24" 427 }, 428 "deepseek/deepseek-v3.2": { 429 "mode": "chat", 430 "context_window": { 431 "max_input": 163840, 432 "max_output": 65536, 433 "max_tokens": 65536 434 }, 435 "pricing": { 436 "input_per_million_tokens": 0.269, 437 "output_per_million_tokens": 0.4, 438 "cache_read_per_million_tokens": 0.1345 439 }, 440 "capabilities": { 441 "function_calling": true, 442 "vision": false, 443 "reasoning": true, 444 "prompt_caching": false, 445 "response_schema": true 446 }, 447 "last_updated_at": "2026-04-24" 448 }, 449 "deepseek/deepseek-v3.2-exp": { 450 "mode": "chat", 451 "context_window": { 452 "max_input": 163840, 453 "max_output": 65536, 454 "max_tokens": 65536 455 }, 456 "pricing": { 457 "input_per_million_tokens": 0.27, 458 "output_per_million_tokens": 0.41 459 }, 460 "capabilities": { 461 "function_calling": true, 462 "vision": false, 463 "reasoning": true, 464 "prompt_caching": false, 465 "response_schema": true 466 }, 467 "last_updated_at": "2026-04-24" 468 }, 469 "google/gemma-3-12b-it": { 470 "mode": "chat", 471 "context_window": { 472 "max_input": 131072, 473 "max_output": 8192, 474 "max_tokens": 8192 475 }, 476 "pricing": { 477 "input_per_million_tokens": 0.05, 478 "output_per_million_tokens": 0.1 479 }, 480 "capabilities": { 481 "function_calling": false, 482 "vision": true, 483 "reasoning": false, 484 "prompt_caching": false, 485 "response_schema": true 486 }, 487 "last_updated_at": "2026-04-24" 488 }, 489 "google/gemma-3-27b-it": { 490 "mode": "chat", 491 "context_window": { 492 "max_input": 98304, 493 "max_output": 16384, 494 "max_tokens": 16384 495 }, 496 "pricing": { 497 "input_per_million_tokens": 0.119, 498 "output_per_million_tokens": 0.2 499 }, 500 "capabilities": { 501 "function_calling": false, 502 "vision": true, 503 "reasoning": false, 504 "prompt_caching": false, 505 "response_schema": false 506 }, 507 "last_updated_at": "2026-04-24" 508 }, 509 "gryphe/mythomax-l2-13b": { 510 "mode": "chat", 511 "context_window": { 512 "max_input": 4096, 513 "max_output": 3200, 514 "max_tokens": 3200 515 }, 516 "pricing": { 517 "input_per_million_tokens": 0.09, 518 "output_per_million_tokens": 0.09 519 }, 520 "capabilities": { 521 "function_calling": false, 522 "vision": false, 523 "reasoning": false, 524 "prompt_caching": false, 525 "response_schema": false 526 }, 527 "last_updated_at": "2026-04-24" 528 }, 529 "kwaipilot/kat-coder-pro": { 530 "mode": "chat", 531 "context_window": { 532 "max_input": 256000, 533 "max_output": 128000, 534 "max_tokens": 128000 535 }, 536 "pricing": { 537 "input_per_million_tokens": 0.3, 538 "output_per_million_tokens": 1.2, 539 "cache_read_per_million_tokens": 0.06 540 }, 541 "capabilities": { 542 "function_calling": true, 543 "vision": false, 544 "reasoning": false, 545 "prompt_caching": false, 546 "response_schema": true 547 }, 548 "last_updated_at": "2026-04-24" 549 }, 550 "meta-llama/llama-3-70b-instruct": { 551 "mode": "chat", 552 "context_window": { 553 "max_input": 8192, 554 "max_output": 8000, 555 "max_tokens": 8000 556 }, 557 "pricing": { 558 "input_per_million_tokens": 0.51, 559 "output_per_million_tokens": 0.74 560 }, 561 "capabilities": { 562 "function_calling": false, 563 "vision": false, 564 "reasoning": false, 565 "prompt_caching": false, 566 "response_schema": true 567 }, 568 "last_updated_at": "2026-04-24" 569 }, 570 "meta-llama/llama-3-8b-instruct": { 571 "mode": "chat", 572 "context_window": { 573 "max_input": 8192, 574 "max_output": 8192, 575 "max_tokens": 8192 576 }, 577 "pricing": { 578 "input_per_million_tokens": 0.04, 579 "output_per_million_tokens": 0.04 580 }, 581 "capabilities": { 582 "function_calling": false, 583 "vision": false, 584 "reasoning": false, 585 "prompt_caching": false, 586 "response_schema": false 587 }, 588 "last_updated_at": "2026-04-24" 589 }, 590 "meta-llama/llama-3.1-8b-instruct": { 591 "mode": "chat", 592 "context_window": { 593 "max_input": 16384, 594 "max_output": 16384, 595 "max_tokens": 16384 596 }, 597 "pricing": { 598 "input_per_million_tokens": 0.02, 599 "output_per_million_tokens": 0.05 600 }, 601 "capabilities": { 602 "function_calling": false, 603 "vision": false, 604 "reasoning": false, 605 "prompt_caching": false, 606 "response_schema": false 607 }, 608 "last_updated_at": "2026-04-24" 609 }, 610 "meta-llama/llama-3.2-3b-instruct": { 611 "mode": "chat", 612 "context_window": { 613 "max_input": 32768, 614 "max_output": 32000, 615 "max_tokens": 32000 616 }, 617 "pricing": { 618 "input_per_million_tokens": 0.03, 619 "output_per_million_tokens": 0.05 620 }, 621 "capabilities": { 622 "function_calling": true, 623 "vision": false, 624 "reasoning": false, 625 "prompt_caching": false, 626 "response_schema": false 627 }, 628 "last_updated_at": "2026-04-24" 629 }, 630 "meta-llama/llama-3.3-70b-instruct": { 631 "mode": "chat", 632 "context_window": { 633 "max_input": 131072, 634 "max_output": 120000, 635 "max_tokens": 120000 636 }, 637 "pricing": { 638 "input_per_million_tokens": 0.135, 639 "output_per_million_tokens": 0.4 640 }, 641 "capabilities": { 642 "function_calling": true, 643 "vision": false, 644 "reasoning": false, 645 "prompt_caching": false, 646 "response_schema": false 647 }, 648 "last_updated_at": "2026-04-24" 649 }, 650 "meta-llama/llama-4-maverick-17b-128e-instruct-fp8": { 651 "mode": "chat", 652 "context_window": { 653 "max_input": 1048576, 654 "max_output": 8192, 655 "max_tokens": 8192 656 }, 657 "pricing": { 658 "input_per_million_tokens": 0.27, 659 "output_per_million_tokens": 0.85 660 }, 661 "capabilities": { 662 "function_calling": false, 663 "vision": true, 664 "reasoning": false, 665 "prompt_caching": false, 666 "response_schema": false 667 }, 668 "last_updated_at": "2026-04-24" 669 }, 670 "meta-llama/llama-4-scout-17b-16e-instruct": { 671 "mode": "chat", 672 "context_window": { 673 "max_input": 131072, 674 "max_output": 131072, 675 "max_tokens": 131072 676 }, 677 "pricing": { 678 "input_per_million_tokens": 0.18, 679 "output_per_million_tokens": 0.59 680 }, 681 "capabilities": { 682 "function_calling": false, 683 "vision": true, 684 "reasoning": false, 685 "prompt_caching": false, 686 "response_schema": false 687 }, 688 "last_updated_at": "2026-04-24" 689 }, 690 "microsoft/wizardlm-2-8x22b": { 691 "mode": "chat", 692 "context_window": { 693 "max_input": 65535, 694 "max_output": 8000, 695 "max_tokens": 8000 696 }, 697 "pricing": { 698 "input_per_million_tokens": 0.62, 699 "output_per_million_tokens": 0.62 700 }, 701 "capabilities": { 702 "function_calling": false, 703 "vision": false, 704 "reasoning": false, 705 "prompt_caching": false, 706 "response_schema": false 707 }, 708 "last_updated_at": "2026-04-24" 709 }, 710 "minimax/minimax-m2": { 711 "mode": "chat", 712 "context_window": { 713 "max_input": 204800, 714 "max_output": 131072, 715 "max_tokens": 131072 716 }, 717 "pricing": { 718 "input_per_million_tokens": 0.3, 719 "output_per_million_tokens": 1.2, 720 "cache_read_per_million_tokens": 0.03 721 }, 722 "capabilities": { 723 "function_calling": true, 724 "vision": false, 725 "reasoning": true, 726 "prompt_caching": false, 727 "response_schema": false 728 }, 729 "last_updated_at": "2026-04-24" 730 }, 731 "minimax/minimax-m2.1": { 732 "mode": "chat", 733 "context_window": { 734 "max_input": 204800, 735 "max_output": 131072, 736 "max_tokens": 131072 737 }, 738 "pricing": { 739 "input_per_million_tokens": 0.3, 740 "output_per_million_tokens": 1.2, 741 "cache_read_per_million_tokens": 0.03 742 }, 743 "capabilities": { 744 "function_calling": true, 745 "vision": false, 746 "reasoning": false, 747 "prompt_caching": false, 748 "response_schema": true 749 }, 750 "last_updated_at": "2026-04-24" 751 }, 752 "minimaxai/minimax-m1-80k": { 753 "mode": "chat", 754 "context_window": { 755 "max_input": 1000000, 756 "max_output": 40000, 757 "max_tokens": 40000 758 }, 759 "pricing": { 760 "input_per_million_tokens": 0.55, 761 "output_per_million_tokens": 2.2 762 }, 763 "capabilities": { 764 "function_calling": true, 765 "vision": false, 766 "reasoning": true, 767 "prompt_caching": false, 768 "response_schema": false 769 }, 770 "last_updated_at": "2026-04-24" 771 }, 772 "mistralai/mistral-nemo": { 773 "mode": "chat", 774 "context_window": { 775 "max_input": 60288, 776 "max_output": 16000, 777 "max_tokens": 16000 778 }, 779 "pricing": { 780 "input_per_million_tokens": 0.04, 781 "output_per_million_tokens": 0.17 782 }, 783 "capabilities": { 784 "function_calling": false, 785 "vision": false, 786 "reasoning": false, 787 "prompt_caching": false, 788 "response_schema": true 789 }, 790 "last_updated_at": "2026-04-24" 791 }, 792 "moonshotai/kimi-k2-0905": { 793 "mode": "chat", 794 "context_window": { 795 "max_input": 262144, 796 "max_output": 262144, 797 "max_tokens": 262144 798 }, 799 "pricing": { 800 "input_per_million_tokens": 0.6, 801 "output_per_million_tokens": 2.5 802 }, 803 "capabilities": { 804 "function_calling": true, 805 "vision": false, 806 "reasoning": false, 807 "prompt_caching": false, 808 "response_schema": true 809 }, 810 "last_updated_at": "2026-04-24" 811 }, 812 "moonshotai/kimi-k2-instruct": { 813 "mode": "chat", 814 "context_window": { 815 "max_input": 131072, 816 "max_output": 131072, 817 "max_tokens": 131072 818 }, 819 "pricing": { 820 "input_per_million_tokens": 0.57, 821 "output_per_million_tokens": 2.3 822 }, 823 "capabilities": { 824 "function_calling": true, 825 "vision": false, 826 "reasoning": false, 827 "prompt_caching": false, 828 "response_schema": true 829 }, 830 "last_updated_at": "2026-04-24" 831 }, 832 "moonshotai/kimi-k2-thinking": { 833 "mode": "chat", 834 "context_window": { 835 "max_input": 262144, 836 "max_output": 262144, 837 "max_tokens": 262144 838 }, 839 "pricing": { 840 "input_per_million_tokens": 0.6, 841 "output_per_million_tokens": 2.5 842 }, 843 "capabilities": { 844 "function_calling": true, 845 "vision": false, 846 "reasoning": true, 847 "prompt_caching": false, 848 "response_schema": true 849 }, 850 "last_updated_at": "2026-04-24" 851 }, 852 "nousresearch/hermes-2-pro-llama-3-8b": { 853 "mode": "chat", 854 "context_window": { 855 "max_input": 8192, 856 "max_output": 8192, 857 "max_tokens": 8192 858 }, 859 "pricing": { 860 "input_per_million_tokens": 0.14, 861 "output_per_million_tokens": 0.14 862 }, 863 "capabilities": { 864 "function_calling": false, 865 "vision": false, 866 "reasoning": false, 867 "prompt_caching": false, 868 "response_schema": true 869 }, 870 "last_updated_at": "2026-04-24" 871 }, 872 "openai/gpt-oss-120b": { 873 "mode": "chat", 874 "context_window": { 875 "max_input": 131072, 876 "max_output": 32768, 877 "max_tokens": 32768 878 }, 879 "pricing": { 880 "input_per_million_tokens": 0.05, 881 "output_per_million_tokens": 0.25 882 }, 883 "capabilities": { 884 "function_calling": true, 885 "vision": true, 886 "reasoning": true, 887 "prompt_caching": false, 888 "response_schema": true 889 }, 890 "last_updated_at": "2026-04-24" 891 }, 892 "openai/gpt-oss-20b": { 893 "mode": "chat", 894 "context_window": { 895 "max_input": 131072, 896 "max_output": 32768, 897 "max_tokens": 32768 898 }, 899 "pricing": { 900 "input_per_million_tokens": 0.04, 901 "output_per_million_tokens": 0.15 902 }, 903 "capabilities": { 904 "function_calling": false, 905 "vision": true, 906 "reasoning": true, 907 "prompt_caching": false, 908 "response_schema": true 909 }, 910 "last_updated_at": "2026-04-24" 911 }, 912 "paddlepaddle/paddleocr-vl": { 913 "mode": "chat", 914 "context_window": { 915 "max_input": 16384, 916 "max_output": 16384, 917 "max_tokens": 16384 918 }, 919 "pricing": { 920 "input_per_million_tokens": 0.02, 921 "output_per_million_tokens": 0.02 922 }, 923 "capabilities": { 924 "function_calling": false, 925 "vision": true, 926 "reasoning": false, 927 "prompt_caching": false, 928 "response_schema": false 929 }, 930 "last_updated_at": "2026-04-24" 931 }, 932 "qwen/qwen-2.5-72b-instruct": { 933 "mode": "chat", 934 "context_window": { 935 "max_input": 32000, 936 "max_output": 8192, 937 "max_tokens": 8192 938 }, 939 "pricing": { 940 "input_per_million_tokens": 0.38, 941 "output_per_million_tokens": 0.4 942 }, 943 "capabilities": { 944 "function_calling": true, 945 "vision": false, 946 "reasoning": false, 947 "prompt_caching": false, 948 "response_schema": true 949 }, 950 "last_updated_at": "2026-04-24" 951 }, 952 "qwen/qwen-mt-plus": { 953 "mode": "chat", 954 "context_window": { 955 "max_input": 16384, 956 "max_output": 8192, 957 "max_tokens": 8192 958 }, 959 "pricing": { 960 "input_per_million_tokens": 0.25, 961 "output_per_million_tokens": 0.75 962 }, 963 "capabilities": { 964 "function_calling": false, 965 "vision": false, 966 "reasoning": false, 967 "prompt_caching": false, 968 "response_schema": false 969 }, 970 "last_updated_at": "2026-04-24" 971 }, 972 "qwen/qwen2.5-7b-instruct": { 973 "mode": "chat", 974 "context_window": { 975 "max_input": 32000, 976 "max_output": 32000, 977 "max_tokens": 32000 978 }, 979 "pricing": { 980 "input_per_million_tokens": 0.07, 981 "output_per_million_tokens": 0.07 982 }, 983 "capabilities": { 984 "function_calling": true, 985 "vision": false, 986 "reasoning": false, 987 "prompt_caching": false, 988 "response_schema": true 989 }, 990 "last_updated_at": "2026-04-24" 991 }, 992 "qwen/qwen2.5-vl-72b-instruct": { 993 "mode": "chat", 994 "context_window": { 995 "max_input": 32768, 996 "max_output": 32768, 997 "max_tokens": 32768 998 }, 999 "pricing": { 1000 "input_per_million_tokens": 0.8, 1001 "output_per_million_tokens": 0.8 1002 }, 1003 "capabilities": { 1004 "function_calling": false, 1005 "vision": true, 1006 "reasoning": false, 1007 "prompt_caching": false, 1008 "response_schema": false 1009 }, 1010 "last_updated_at": "2026-04-24" 1011 }, 1012 "qwen/qwen3-235b-a22b-fp8": { 1013 "mode": "chat", 1014 "context_window": { 1015 "max_input": 40960, 1016 "max_output": 20000, 1017 "max_tokens": 20000 1018 }, 1019 "pricing": { 1020 "input_per_million_tokens": 0.2, 1021 "output_per_million_tokens": 0.8 1022 }, 1023 "capabilities": { 1024 "function_calling": false, 1025 "vision": false, 1026 "reasoning": true, 1027 "prompt_caching": false, 1028 "response_schema": false 1029 }, 1030 "last_updated_at": "2026-04-24" 1031 }, 1032 "qwen/qwen3-235b-a22b-instruct-2507": { 1033 "mode": "chat", 1034 "context_window": { 1035 "max_input": 131072, 1036 "max_output": 16384, 1037 "max_tokens": 16384 1038 }, 1039 "pricing": { 1040 "input_per_million_tokens": 0.09, 1041 "output_per_million_tokens": 0.58 1042 }, 1043 "capabilities": { 1044 "function_calling": true, 1045 "vision": false, 1046 "reasoning": false, 1047 "prompt_caching": false, 1048 "response_schema": true 1049 }, 1050 "last_updated_at": "2026-04-24" 1051 }, 1052 "qwen/qwen3-235b-a22b-thinking-2507": { 1053 "mode": "chat", 1054 "context_window": { 1055 "max_input": 131072, 1056 "max_output": 32768, 1057 "max_tokens": 32768 1058 }, 1059 "pricing": { 1060 "input_per_million_tokens": 0.3, 1061 "output_per_million_tokens": 3.0 1062 }, 1063 "capabilities": { 1064 "function_calling": true, 1065 "vision": false, 1066 "reasoning": true, 1067 "prompt_caching": false, 1068 "response_schema": false 1069 }, 1070 "last_updated_at": "2026-04-24" 1071 }, 1072 "qwen/qwen3-30b-a3b-fp8": { 1073 "mode": "chat", 1074 "context_window": { 1075 "max_input": 40960, 1076 "max_output": 20000, 1077 "max_tokens": 20000 1078 }, 1079 "pricing": { 1080 "input_per_million_tokens": 0.09, 1081 "output_per_million_tokens": 0.45 1082 }, 1083 "capabilities": { 1084 "function_calling": false, 1085 "vision": false, 1086 "reasoning": true, 1087 "prompt_caching": false, 1088 "response_schema": false 1089 }, 1090 "last_updated_at": "2026-04-24" 1091 }, 1092 "qwen/qwen3-32b-fp8": { 1093 "mode": "chat", 1094 "context_window": { 1095 "max_input": 40960, 1096 "max_output": 20000, 1097 "max_tokens": 20000 1098 }, 1099 "pricing": { 1100 "input_per_million_tokens": 0.1, 1101 "output_per_million_tokens": 0.45 1102 }, 1103 "capabilities": { 1104 "function_calling": false, 1105 "vision": false, 1106 "reasoning": true, 1107 "prompt_caching": false, 1108 "response_schema": false 1109 }, 1110 "last_updated_at": "2026-04-24" 1111 }, 1112 "qwen/qwen3-4b-fp8": { 1113 "mode": "chat", 1114 "context_window": { 1115 "max_input": 128000, 1116 "max_output": 20000, 1117 "max_tokens": 20000 1118 }, 1119 "pricing": { 1120 "input_per_million_tokens": 0.03, 1121 "output_per_million_tokens": 0.03 1122 }, 1123 "capabilities": { 1124 "function_calling": false, 1125 "vision": false, 1126 "reasoning": true, 1127 "prompt_caching": false, 1128 "response_schema": false 1129 }, 1130 "last_updated_at": "2026-04-24" 1131 }, 1132 "qwen/qwen3-8b-fp8": { 1133 "mode": "chat", 1134 "context_window": { 1135 "max_input": 128000, 1136 "max_output": 20000, 1137 "max_tokens": 20000 1138 }, 1139 "pricing": { 1140 "input_per_million_tokens": 0.035, 1141 "output_per_million_tokens": 0.138 1142 }, 1143 "capabilities": { 1144 "function_calling": false, 1145 "vision": false, 1146 "reasoning": true, 1147 "prompt_caching": false, 1148 "response_schema": false 1149 }, 1150 "last_updated_at": "2026-04-24" 1151 }, 1152 "qwen/qwen3-coder-30b-a3b-instruct": { 1153 "mode": "chat", 1154 "context_window": { 1155 "max_input": 160000, 1156 "max_output": 32768, 1157 "max_tokens": 32768 1158 }, 1159 "pricing": { 1160 "input_per_million_tokens": 0.07, 1161 "output_per_million_tokens": 0.27 1162 }, 1163 "capabilities": { 1164 "function_calling": true, 1165 "vision": false, 1166 "reasoning": false, 1167 "prompt_caching": false, 1168 "response_schema": true 1169 }, 1170 "last_updated_at": "2026-04-24" 1171 }, 1172 "qwen/qwen3-coder-480b-a35b-instruct": { 1173 "mode": "chat", 1174 "context_window": { 1175 "max_input": 262144, 1176 "max_output": 65536, 1177 "max_tokens": 65536 1178 }, 1179 "pricing": { 1180 "input_per_million_tokens": 0.3, 1181 "output_per_million_tokens": 1.3 1182 }, 1183 "capabilities": { 1184 "function_calling": true, 1185 "vision": false, 1186 "reasoning": false, 1187 "prompt_caching": false, 1188 "response_schema": true 1189 }, 1190 "last_updated_at": "2026-04-24" 1191 }, 1192 "qwen/qwen3-embedding-0.6b": { 1193 "mode": "embedding", 1194 "context_window": { 1195 "max_input": 32768, 1196 "max_output": 32768, 1197 "max_tokens": 32768 1198 }, 1199 "pricing": { 1200 "input_per_million_tokens": 0.07, 1201 "output_per_million_tokens": 0 1202 }, 1203 "capabilities": { 1204 "function_calling": false, 1205 "vision": false, 1206 "reasoning": false, 1207 "prompt_caching": false, 1208 "response_schema": false 1209 }, 1210 "last_updated_at": "2026-04-24" 1211 }, 1212 "qwen/qwen3-embedding-8b": { 1213 "mode": "embedding", 1214 "context_window": { 1215 "max_input": 32768, 1216 "max_output": 4096, 1217 "max_tokens": 4096 1218 }, 1219 "pricing": { 1220 "input_per_million_tokens": 0.07, 1221 "output_per_million_tokens": 0 1222 }, 1223 "capabilities": { 1224 "function_calling": false, 1225 "vision": false, 1226 "reasoning": false, 1227 "prompt_caching": false, 1228 "response_schema": false 1229 }, 1230 "last_updated_at": "2026-04-24" 1231 }, 1232 "qwen/qwen3-max": { 1233 "mode": "chat", 1234 "context_window": { 1235 "max_input": 262144, 1236 "max_output": 65536, 1237 "max_tokens": 65536 1238 }, 1239 "pricing": { 1240 "input_per_million_tokens": 2.11, 1241 "output_per_million_tokens": 8.45 1242 }, 1243 "capabilities": { 1244 "function_calling": true, 1245 "vision": false, 1246 "reasoning": false, 1247 "prompt_caching": false, 1248 "response_schema": true 1249 }, 1250 "last_updated_at": "2026-04-24" 1251 }, 1252 "qwen/qwen3-next-80b-a3b-instruct": { 1253 "mode": "chat", 1254 "context_window": { 1255 "max_input": 131072, 1256 "max_output": 32768, 1257 "max_tokens": 32768 1258 }, 1259 "pricing": { 1260 "input_per_million_tokens": 0.15, 1261 "output_per_million_tokens": 1.5 1262 }, 1263 "capabilities": { 1264 "function_calling": true, 1265 "vision": false, 1266 "reasoning": false, 1267 "prompt_caching": false, 1268 "response_schema": true 1269 }, 1270 "last_updated_at": "2026-04-24" 1271 }, 1272 "qwen/qwen3-next-80b-a3b-thinking": { 1273 "mode": "chat", 1274 "context_window": { 1275 "max_input": 131072, 1276 "max_output": 32768, 1277 "max_tokens": 32768 1278 }, 1279 "pricing": { 1280 "input_per_million_tokens": 0.15, 1281 "output_per_million_tokens": 1.5 1282 }, 1283 "capabilities": { 1284 "function_calling": true, 1285 "vision": false, 1286 "reasoning": true, 1287 "prompt_caching": false, 1288 "response_schema": true 1289 }, 1290 "last_updated_at": "2026-04-24" 1291 }, 1292 "qwen/qwen3-omni-30b-a3b-instruct": { 1293 "mode": "chat", 1294 "context_window": { 1295 "max_input": 65536, 1296 "max_output": 16384, 1297 "max_tokens": 16384 1298 }, 1299 "pricing": { 1300 "input_per_million_tokens": 0.25, 1301 "output_per_million_tokens": 0.97 1302 }, 1303 "capabilities": { 1304 "function_calling": true, 1305 "vision": true, 1306 "reasoning": false, 1307 "prompt_caching": false, 1308 "response_schema": true 1309 }, 1310 "last_updated_at": "2026-04-24" 1311 }, 1312 "qwen/qwen3-omni-30b-a3b-thinking": { 1313 "mode": "chat", 1314 "context_window": { 1315 "max_input": 65536, 1316 "max_output": 16384, 1317 "max_tokens": 16384 1318 }, 1319 "pricing": { 1320 "input_per_million_tokens": 0.25, 1321 "output_per_million_tokens": 0.97 1322 }, 1323 "capabilities": { 1324 "function_calling": true, 1325 "vision": true, 1326 "reasoning": true, 1327 "prompt_caching": false, 1328 "response_schema": true 1329 }, 1330 "last_updated_at": "2026-04-24" 1331 }, 1332 "qwen/qwen3-vl-235b-a22b-instruct": { 1333 "mode": "chat", 1334 "context_window": { 1335 "max_input": 131072, 1336 "max_output": 32768, 1337 "max_tokens": 32768 1338 }, 1339 "pricing": { 1340 "input_per_million_tokens": 0.3, 1341 "output_per_million_tokens": 1.5 1342 }, 1343 "capabilities": { 1344 "function_calling": true, 1345 "vision": true, 1346 "reasoning": false, 1347 "prompt_caching": false, 1348 "response_schema": true 1349 }, 1350 "last_updated_at": "2026-04-24" 1351 }, 1352 "qwen/qwen3-vl-235b-a22b-thinking": { 1353 "mode": "chat", 1354 "context_window": { 1355 "max_input": 131072, 1356 "max_output": 32768, 1357 "max_tokens": 32768 1358 }, 1359 "pricing": { 1360 "input_per_million_tokens": 0.98, 1361 "output_per_million_tokens": 3.95 1362 }, 1363 "capabilities": { 1364 "function_calling": false, 1365 "vision": true, 1366 "reasoning": true, 1367 "prompt_caching": false, 1368 "response_schema": false 1369 }, 1370 "last_updated_at": "2026-04-24" 1371 }, 1372 "qwen/qwen3-vl-30b-a3b-instruct": { 1373 "mode": "chat", 1374 "context_window": { 1375 "max_input": 131072, 1376 "max_output": 32768, 1377 "max_tokens": 32768 1378 }, 1379 "pricing": { 1380 "input_per_million_tokens": 0.2, 1381 "output_per_million_tokens": 0.7 1382 }, 1383 "capabilities": { 1384 "function_calling": true, 1385 "vision": true, 1386 "reasoning": false, 1387 "prompt_caching": false, 1388 "response_schema": true 1389 }, 1390 "last_updated_at": "2026-04-24" 1391 }, 1392 "qwen/qwen3-vl-30b-a3b-thinking": { 1393 "mode": "chat", 1394 "context_window": { 1395 "max_input": 131072, 1396 "max_output": 32768, 1397 "max_tokens": 32768 1398 }, 1399 "pricing": { 1400 "input_per_million_tokens": 0.2, 1401 "output_per_million_tokens": 1.0 1402 }, 1403 "capabilities": { 1404 "function_calling": true, 1405 "vision": true, 1406 "reasoning": false, 1407 "prompt_caching": false, 1408 "response_schema": true 1409 }, 1410 "last_updated_at": "2026-04-24" 1411 }, 1412 "qwen/qwen3-vl-8b-instruct": { 1413 "mode": "chat", 1414 "context_window": { 1415 "max_input": 131072, 1416 "max_output": 32768, 1417 "max_tokens": 32768 1418 }, 1419 "pricing": { 1420 "input_per_million_tokens": 0.08, 1421 "output_per_million_tokens": 0.5 1422 }, 1423 "capabilities": { 1424 "function_calling": true, 1425 "vision": true, 1426 "reasoning": false, 1427 "prompt_caching": false, 1428 "response_schema": true 1429 }, 1430 "last_updated_at": "2026-04-24" 1431 }, 1432 "sao10k/l3-70b-euryale-v2.1": { 1433 "mode": "chat", 1434 "context_window": { 1435 "max_input": 8192, 1436 "max_output": 8192, 1437 "max_tokens": 8192 1438 }, 1439 "pricing": { 1440 "input_per_million_tokens": 1.48, 1441 "output_per_million_tokens": 1.48 1442 }, 1443 "capabilities": { 1444 "function_calling": true, 1445 "vision": false, 1446 "reasoning": false, 1447 "prompt_caching": false, 1448 "response_schema": false 1449 }, 1450 "last_updated_at": "2026-04-24" 1451 }, 1452 "sao10k/l3-8b-lunaris": { 1453 "mode": "chat", 1454 "context_window": { 1455 "max_input": 8192, 1456 "max_output": 8192, 1457 "max_tokens": 8192 1458 }, 1459 "pricing": { 1460 "input_per_million_tokens": 0.05, 1461 "output_per_million_tokens": 0.05 1462 }, 1463 "capabilities": { 1464 "function_calling": false, 1465 "vision": false, 1466 "reasoning": false, 1467 "prompt_caching": false, 1468 "response_schema": true 1469 }, 1470 "last_updated_at": "2026-04-24" 1471 }, 1472 "sao10k/l31-70b-euryale-v2.2": { 1473 "mode": "chat", 1474 "context_window": { 1475 "max_input": 8192, 1476 "max_output": 8192, 1477 "max_tokens": 8192 1478 }, 1479 "pricing": { 1480 "input_per_million_tokens": 1.48, 1481 "output_per_million_tokens": 1.48 1482 }, 1483 "capabilities": { 1484 "function_calling": true, 1485 "vision": false, 1486 "reasoning": false, 1487 "prompt_caching": false, 1488 "response_schema": false 1489 }, 1490 "last_updated_at": "2026-04-24" 1491 }, 1492 "skywork/r1v4-lite": { 1493 "mode": "chat", 1494 "context_window": { 1495 "max_input": 262144, 1496 "max_output": 65536, 1497 "max_tokens": 65536 1498 }, 1499 "pricing": { 1500 "input_per_million_tokens": 0.2, 1501 "output_per_million_tokens": 0.6 1502 }, 1503 "capabilities": { 1504 "function_calling": false, 1505 "vision": true, 1506 "reasoning": false, 1507 "prompt_caching": false, 1508 "response_schema": true 1509 }, 1510 "last_updated_at": "2026-04-24" 1511 }, 1512 "xiaomimimo/mimo-v2-flash": { 1513 "mode": "chat", 1514 "context_window": { 1515 "max_input": 262144, 1516 "max_output": 32000, 1517 "max_tokens": 32000 1518 }, 1519 "pricing": { 1520 "input_per_million_tokens": 0.1, 1521 "output_per_million_tokens": 0.3, 1522 "cache_read_per_million_tokens": 0.02 1523 }, 1524 "capabilities": { 1525 "function_calling": true, 1526 "vision": false, 1527 "reasoning": true, 1528 "prompt_caching": false, 1529 "response_schema": true 1530 }, 1531 "last_updated_at": "2026-04-24" 1532 }, 1533 "zai-org/autoglm-phone-9b-multilingual": { 1534 "mode": "chat", 1535 "context_window": { 1536 "max_input": 65536, 1537 "max_output": 65536, 1538 "max_tokens": 65536 1539 }, 1540 "pricing": { 1541 "input_per_million_tokens": 0.035, 1542 "output_per_million_tokens": 0.138 1543 }, 1544 "capabilities": { 1545 "function_calling": false, 1546 "vision": true, 1547 "reasoning": false, 1548 "prompt_caching": false, 1549 "response_schema": false 1550 }, 1551 "last_updated_at": "2026-04-24" 1552 }, 1553 "zai-org/glm-4.5": { 1554 "mode": "chat", 1555 "context_window": { 1556 "max_input": 131072, 1557 "max_output": 98304, 1558 "max_tokens": 98304 1559 }, 1560 "pricing": { 1561 "input_per_million_tokens": 0.6, 1562 "output_per_million_tokens": 2.2, 1563 "cache_read_per_million_tokens": 0.11 1564 }, 1565 "capabilities": { 1566 "function_calling": true, 1567 "vision": false, 1568 "reasoning": true, 1569 "prompt_caching": false, 1570 "response_schema": false 1571 }, 1572 "last_updated_at": "2026-04-24" 1573 }, 1574 "zai-org/glm-4.5-air": { 1575 "mode": "chat", 1576 "context_window": { 1577 "max_input": 131072, 1578 "max_output": 98304, 1579 "max_tokens": 98304 1580 }, 1581 "pricing": { 1582 "input_per_million_tokens": 0.13, 1583 "output_per_million_tokens": 0.85 1584 }, 1585 "capabilities": { 1586 "function_calling": true, 1587 "vision": false, 1588 "reasoning": true, 1589 "prompt_caching": false, 1590 "response_schema": false 1591 }, 1592 "last_updated_at": "2026-04-24" 1593 }, 1594 "zai-org/glm-4.5v": { 1595 "mode": "chat", 1596 "context_window": { 1597 "max_input": 65536, 1598 "max_output": 16384, 1599 "max_tokens": 16384 1600 }, 1601 "pricing": { 1602 "input_per_million_tokens": 0.6, 1603 "output_per_million_tokens": 1.8, 1604 "cache_read_per_million_tokens": 0.11 1605 }, 1606 "capabilities": { 1607 "function_calling": true, 1608 "vision": true, 1609 "reasoning": true, 1610 "prompt_caching": false, 1611 "response_schema": true 1612 }, 1613 "last_updated_at": "2026-04-24" 1614 }, 1615 "zai-org/glm-4.6": { 1616 "mode": "chat", 1617 "context_window": { 1618 "max_input": 204800, 1619 "max_output": 131072, 1620 "max_tokens": 131072 1621 }, 1622 "pricing": { 1623 "input_per_million_tokens": 0.55, 1624 "output_per_million_tokens": 2.2, 1625 "cache_read_per_million_tokens": 0.11 1626 }, 1627 "capabilities": { 1628 "function_calling": true, 1629 "vision": false, 1630 "reasoning": true, 1631 "prompt_caching": false, 1632 "response_schema": true 1633 }, 1634 "last_updated_at": "2026-04-24" 1635 }, 1636 "zai-org/glm-4.6v": { 1637 "mode": "chat", 1638 "context_window": { 1639 "max_input": 131072, 1640 "max_output": 32768, 1641 "max_tokens": 32768 1642 }, 1643 "pricing": { 1644 "input_per_million_tokens": 0.3, 1645 "output_per_million_tokens": 0.9, 1646 "cache_read_per_million_tokens": 0.055 1647 }, 1648 "capabilities": { 1649 "function_calling": true, 1650 "vision": true, 1651 "reasoning": true, 1652 "prompt_caching": false, 1653 "response_schema": true 1654 }, 1655 "last_updated_at": "2026-04-24" 1656 }, 1657 "zai-org/glm-4.7": { 1658 "mode": "chat", 1659 "context_window": { 1660 "max_input": 204800, 1661 "max_output": 131072, 1662 "max_tokens": 131072 1663 }, 1664 "pricing": { 1665 "input_per_million_tokens": 0.6, 1666 "output_per_million_tokens": 2.2, 1667 "cache_read_per_million_tokens": 0.11 1668 }, 1669 "capabilities": { 1670 "function_calling": true, 1671 "vision": false, 1672 "reasoning": true, 1673 "prompt_caching": false, 1674 "response_schema": true 1675 }, 1676 "last_updated_at": "2026-04-24" 1677 } 1678 } 1679 }