/ mlflow / deployments / server / config.py
config.py
 1  from pydantic import ConfigDict
 2  
 3  from mlflow.gateway.base_models import ResponseModel
 4  from mlflow.gateway.config import EndpointModelInfo, Limit
 5  
 6  
# Response model describing a single deployments-server endpoint: its name,
# its type, the model behind it, the URL it is invoked at, and an optional
# rate limit.
#
# NOTE: documented with comments rather than a class docstring on purpose --
# pydantic uses a model's docstring as the "description" of the generated JSON
# schema, so adding one would change the published schema.
class Endpoint(ResponseModel):
    # Name of the endpoint, e.g. "openai-completions".
    name: str
    # Type string of the endpoint, e.g. "llm/v1/completions".
    endpoint_type: str
    # Model served by the endpoint; the schema example below populates its
    # `name` and `provider` entries.
    model: EndpointModelInfo
    # URL the endpoint is invoked at, e.g. "/endpoints/completions/invocations".
    endpoint_url: str
    # Limit attached to the endpoint, or None.
    # NOTE(review): no default is declared, which under pydantic v2 semantics
    # makes the field required-but-nullable (callers must pass `limit`, even as
    # None) -- confirm this is intended.
    limit: Limit | None

    # Attach an example payload to the model's JSON schema via
    # `json_schema_extra`.
    model_config = ConfigDict(
        json_schema_extra={
            "example": {
                "name": "openai-completions",
                "endpoint_type": "llm/v1/completions",
                "model": {
                    "name": "gpt-4o-mini",
                    "provider": "openai",
                },
                "endpoint_url": "/endpoints/completions/invocations",
                "limit": {"calls": 1, "key": None, "renewal_period": "minute"},
            }
        }
    )