Module Values_0.InstancePool

Specifies an instance type and its priority for a heterogeneous endpoint. Use instance pools to configure a production variant with multiple instance types, enabling the endpoint to provision instances across different types based on priority.

type nonrec t = {
  1. instanceType : ProductionVariantInstanceType.t;
    (*

    The ML compute instance type for the instance pool.

    *)
  2. modelNameOverride : ModelName.t option;
    (*

    The name of a SageMaker model to use for this instance pool instead of the model specified for the production variant. Use this to deploy a different model optimized for the instance type in this pool.

    *)
  3. priority : InstancePoolPriority.t;
    (*

    The priority for the instance pool. SageMaker attempts to provision instances in order of priority, starting with the lowest value. If instances for a higher-priority pool are unavailable, SageMaker attempts to provision from the next pool. Valid values: 1 to 5, where 1 is the highest priority.

    *)
}
val context_ : string
val make : ?modelNameOverride:ModelName.t -> instanceType:ProductionVariantInstanceType.t -> priority:InstancePoolPriority.t -> unit -> t
val to_value : t -> [> `Structure of (string * [> `Enum of string | `Integer of InstancePoolPriority.t | `String of ModelName.t ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t