Up – Package index » awso » Library awso.bedrock » Awso_bedrock » Values » RFTConfig

Module `Values.RFTConfig`

Configuration settings for reinforcement fine-tuning (RFT), including grader configuration and training hyperparameters.

type nonrec t = {

graderConfig : GraderConfig.t option;
(*
Configuration for the grader that evaluates model responses and provides reward signals during RFT training.
*)
hyperParameters : RFTHyperParameters.t option;
(*
Hyperparameters that control the reinforcement fine-tuning training process, including learning rate, batch size, and epoch count.
*)

}

val make : ?graderConfig:GraderConfig.t -> ?hyperParameters:RFTHyperParameters.t -> unit -> t

val to_value :
  t ->
  [> `Structure of
       (string
        * [> `Structure of
               (string
                * [> `Enum of string
                  | `Float of RFTLearningRate.t
                  | `Integer of EpochCount.t
                  | `Structure of (string * [> `String of LambdaArn.t ]) list ])
                 list ])
         list ]

val to_query : t -> Awso.Client.Query.t

val of_xml : Awso.Xml.t -> t

val of_string : string -> t

val of_json : Yojson.Safe.t -> t

val to_json : t -> Yojson.Safe.t