Module Values_1.InferenceComponentSchedulingConfigSource

The scheduling configuration that determines how inference component copies are placed across available instances when copies are added or removed.

Sourcetype nonrec t = {
  1. placementStrategy : InferenceComponentPlacementStrategy.t;
    (*

    The strategy for placing inference component copies across available instances. If you also set AvailabilityZoneBalance, this strategy applies to placement within each Availability Zone. Valid values: SPREAD — distributes copies evenly across available instances for better resilience; BINPACK — packs copies onto fewer instances to optimize resource utilization.

    *)
  2. availabilityZoneBalance : InferenceComponentAvailabilityZoneBalance.t option;
    (*

    Configuration for balancing inference component copies across Availability Zones.

    *)
}
Sourceval context_ : string
Sourceval make : ?availabilityZoneBalance:InferenceComponentAvailabilityZoneBalance.t -> placementStrategy:InferenceComponentPlacementStrategy.t -> unit -> t
Sourceval to_value : t -> [> `Structure of (string * [> `Enum of string | `Structure of (string * [> `Enum of string | `Integer of Values_0.AvailabilityZoneBalanceMaxImbalance.t ]) list ]) list ]
Sourceval to_query : t -> Awso.Client.Query.t
Sourceval of_xml : Awso.Xml.t -> t
Sourceval of_string : string -> t
Sourceval of_json : Yojson.Safe.t -> t
Sourceval to_json : t -> Yojson.Safe.t