Module Values_2.ScalingPolicyMetricSource

The metric for a scaling policy.

type nonrec t = {
  invocationsPerInstance : Values_0.Integer.t option;
    (*

    The number of invocations sent to a model, normalized by InstanceCount in each ProductionVariant. 1/numberOfInstances is sent as the value on each request, where numberOfInstances is the number of active instances for the ProductionVariant behind the endpoint at the time of the request.

    *)
  modelLatency : Values_0.Integer.t option;
    (*

    The interval of time taken by a model to respond as viewed from SageMaker. This interval includes the local communication times taken to send the request and to fetch the response from the container of a model and the time taken to complete the inference in the container.

    *)
}
val make : ?invocationsPerInstance:Values_0.Integer.t -> ?modelLatency:Values_0.Integer.t -> unit -> t
val to_value : t -> [> `Structure of (string * [> `Integer of Values_0.Integer.t ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t