/ mlflow / utils / model_catalog / baseten.json
baseten.json
  1  {
  2    "schema_version": "1.0",
  3    "models": {
  4      "MiniMaxAI/MiniMax-M2.5": {
  5        "mode": "chat",
  6        "pricing": {
  7          "input_per_million_tokens": 0.3,
  8          "output_per_million_tokens": 1.2
  9        },
 10        "capabilities": {
 11          "function_calling": false,
 12          "vision": false,
 13          "reasoning": false,
 14          "prompt_caching": false,
 15          "response_schema": false
 16        },
 17        "last_updated_at": "2026-04-24"
 18      },
 19      "deepseek-ai/DeepSeek-V3-0324": {
 20        "mode": "chat",
 21        "pricing": {
 22          "input_per_million_tokens": 0.77,
 23          "output_per_million_tokens": 0.77
 24        },
 25        "capabilities": {
 26          "function_calling": false,
 27          "vision": false,
 28          "reasoning": false,
 29          "prompt_caching": false,
 30          "response_schema": false
 31        },
 32        "last_updated_at": "2026-04-24"
 33      },
 34      "deepseek-ai/DeepSeek-V3.1": {
 35        "mode": "chat",
 36        "pricing": {
 37          "input_per_million_tokens": 0.5,
 38          "output_per_million_tokens": 1.5
 39        },
 40        "capabilities": {
 41          "function_calling": false,
 42          "vision": false,
 43          "reasoning": false,
 44          "prompt_caching": false,
 45          "response_schema": false
 46        },
 47        "last_updated_at": "2026-04-24"
 48      },
 49      "moonshotai/Kimi-K2-Instruct-0905": {
 50        "mode": "chat",
 51        "pricing": {
 52          "input_per_million_tokens": 0.6,
 53          "output_per_million_tokens": 2.5
 54        },
 55        "capabilities": {
 56          "function_calling": false,
 57          "vision": false,
 58          "reasoning": false,
 59          "prompt_caching": false,
 60          "response_schema": false
 61        },
 62        "last_updated_at": "2026-04-24"
 63      },
 64      "moonshotai/Kimi-K2-Thinking": {
 65        "mode": "chat",
 66        "pricing": {
 67          "input_per_million_tokens": 0.6,
 68          "output_per_million_tokens": 2.5
 69        },
 70        "capabilities": {
 71          "function_calling": false,
 72          "vision": false,
 73          "reasoning": false,
 74          "prompt_caching": false,
 75          "response_schema": false
 76        },
 77        "last_updated_at": "2026-04-24"
 78      },
 79      "moonshotai/Kimi-K2.5": {
 80        "mode": "chat",
 81        "pricing": {
 82          "input_per_million_tokens": 0.6,
 83          "output_per_million_tokens": 3.0
 84        },
 85        "capabilities": {
 86          "function_calling": false,
 87          "vision": false,
 88          "reasoning": false,
 89          "prompt_caching": false,
 90          "response_schema": false
 91        },
 92        "last_updated_at": "2026-04-24"
 93      },
 94      "nvidia/Nemotron-120B-A12B": {
 95        "mode": "chat",
 96        "pricing": {
 97          "input_per_million_tokens": 0.3,
 98          "output_per_million_tokens": 0.75
 99        },
100        "capabilities": {
101          "function_calling": false,
102          "vision": false,
103          "reasoning": false,
104          "prompt_caching": false,
105          "response_schema": false
106        },
107        "last_updated_at": "2026-04-24"
108      },
109      "openai/gpt-oss-120b": {
110        "mode": "chat",
111        "pricing": {
112          "input_per_million_tokens": 0.1,
113          "output_per_million_tokens": 0.5
114        },
115        "capabilities": {
116          "function_calling": false,
117          "vision": false,
118          "reasoning": false,
119          "prompt_caching": false,
120          "response_schema": false
121        },
122        "last_updated_at": "2026-04-24"
123      },
124      "zai-org/GLM-4.6": {
125        "mode": "chat",
126        "pricing": {
127          "input_per_million_tokens": 0.6,
128          "output_per_million_tokens": 2.2
129        },
130        "capabilities": {
131          "function_calling": false,
132          "vision": false,
133          "reasoning": false,
134          "prompt_caching": false,
135          "response_schema": false
136        },
137        "last_updated_at": "2026-04-24"
138      },
139      "zai-org/GLM-4.7": {
140        "mode": "chat",
141        "pricing": {
142          "input_per_million_tokens": 0.6,
143          "output_per_million_tokens": 2.2
144        },
145        "capabilities": {
146          "function_calling": false,
147          "vision": false,
148          "reasoning": false,
149          "prompt_caching": false,
150          "response_schema": false
151        },
152        "last_updated_at": "2026-04-24"
153      },
154      "zai-org/GLM-5": {
155        "mode": "chat",
156        "pricing": {
157          "input_per_million_tokens": 0.95,
158          "output_per_million_tokens": 3.15
159        },
160        "capabilities": {
161          "function_calling": false,
162          "vision": false,
163          "reasoning": false,
164          "prompt_caching": false,
165          "response_schema": false
166        },
167        "last_updated_at": "2026-04-24"
168      }
169    }
170  }