Databricks SDK for JavaScript
    Preparing search index...
    interface InferenceEndpointDetailed {
        aiGateway?: AiGatewayConfig;
        budgetPolicyId?: string;
        config?: EndpointCoreConfigOutput;
        creationTimestamp?: bigint;
        creator?: string;
        dataPlaneInfo?: ModelDataPlaneInfo;
        description?: string;
        emailNotifications?: EmailNotifications;
        endpointUrl?: string;
        id?: string;
        lastUpdatedTimestamp?: bigint;
        name?: string;
        pendingConfig?: PendingConfig;
        permissionLevel?: ServingEndpointDetailedPermissionLevel;
        routeOptimized?: boolean;
        state?: InferenceEndpointState;
        tags?: EndpointTag[];
        task?: string;
    }
    Index

    Properties

    aiGateway?: AiGatewayConfig

    The AI Gateway configuration for the serving endpoint. NOTE: External model, provisioned throughput, and pay-per-token endpoints are fully supported; agent endpoints currently only support inference tables.

    budgetPolicyId?: string

    The budget policy associated with the endpoint.

    config?: EndpointCoreConfigOutput

    The config that is currently being served by the endpoint.

    creationTimestamp?: bigint

    The timestamp, in Unix time, when the endpoint was created.

    creator?: string

    The email of the user who created the serving endpoint.

    dataPlaneInfo?: ModelDataPlaneInfo

    Information required to query DataPlane APIs.

    description?: string

    Description of the serving model.

    emailNotifications?: EmailNotifications

    Email notification settings.

    endpointUrl?: string

    Endpoint invocation URL, if route optimization is enabled for the endpoint.

    id?: string

    System-generated ID of the endpoint. This is used to refer to the endpoint in the Permissions API.

    lastUpdatedTimestamp?: bigint

    The timestamp, in Unix time, when the endpoint was last updated by a user.

    name?: string

    The name of the serving endpoint.

    pendingConfig?: PendingConfig

    The config that the endpoint is attempting to update to.

    permissionLevel?: ServingEndpointDetailedPermissionLevel

    The permission level of the principal making the request.

    routeOptimized?: boolean

    Boolean indicating whether route optimization has been enabled for the endpoint.

    state?: InferenceEndpointState

    Information corresponding to the state of the serving endpoint.

    tags?: EndpointTag[]

    Tags attached to the serving endpoint.

    task?: string

    The task type of the serving endpoint.