Module Values_1.InferenceComponentAvailabilityZoneBalance

Configuration for balancing inference component copies across Availability Zones.

type nonrec t = {
  1. enforcementMode : Values_0.AvailabilityZoneBalanceEnforcementMode.t;
    (*

    Determines how strictly the Availability Zone balance constraint is enforced. PERMISSIVE: the endpoint attempts to balance copies across Availability Zones but proceeds with scheduling even if balance can't be achieved due to available capacity or instance distribution across Availability Zones.

    *)
  2. maxImbalance : Values_0.AvailabilityZoneBalanceMaxImbalance.t option;
    (*

    The maximum allowed difference in the number of inference component copies between any two Availability Zones. This parameter applies only when the endpoint has instances across two or more Availability Zones. A copy placement is allowed if it reduces imbalance or the resulting imbalance is within this value. Default value: 0.

    *)
}
val context_ : string
val make : ?maxImbalance:Values_0.AvailabilityZoneBalanceMaxImbalance.t -> enforcementMode:Values_0.AvailabilityZoneBalanceEnforcementMode.t -> unit -> t
val to_value : t -> [> `Structure of (string * [> `Enum of string | `Integer of Values_0.AvailabilityZoneBalanceMaxImbalance.t ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t