Module Values_1.InferenceComponentComputeResourceRequirements

Defines the compute resources to allocate to run a model, plus any adapter models, that you assign to an inference component. These resources include CPU cores, accelerators, and memory.

type nonrec t = {
  numberOfCpuCoresRequired : NumberOfCpuCores.t option;
    (** The number of CPU cores to allocate to run a model that you assign to an inference component. *)
  numberOfAcceleratorDevicesRequired : NumberOfAcceleratorDevices.t option;
    (** The number of accelerators to allocate to run a model that you assign to an inference component. Accelerators include GPUs and Amazon Web Services Inferentia. *)
  minMemoryRequiredInMb : MemoryInMb.t;
    (** The minimum amount of memory, in MB, to allocate to run a model that you assign to an inference component. *)
  maxMemoryRequiredInMb : MemoryInMb.t option;
    (** The maximum amount of memory, in MB, to allocate to run a model that you assign to an inference component. *)
}
val context_ : string
val make :
  ?numberOfCpuCoresRequired:NumberOfCpuCores.t ->
  ?numberOfAcceleratorDevicesRequired:NumberOfAcceleratorDevices.t ->
  ?maxMemoryRequiredInMb:MemoryInMb.t ->
  minMemoryRequiredInMb:MemoryInMb.t ->
  unit ->
  t
val to_value : t -> [> `Structure of (string * [> `Float of NumberOfCpuCores.t | `Integer of MemoryInMb.t ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t