Module Values.RFTConfig

Configuration settings for reinforcement fine-tuning (RFT), including grader configuration and training hyperparameters.

type nonrec t = {
  graderConfig : GraderConfig.t option;
    (** Configuration for the grader that evaluates model responses and provides reward signals during RFT training. *)
  hyperParameters : RFTHyperParameters.t option;
    (** Hyperparameters that control the reinforcement fine-tuning training process, including learning rate, batch size, and epoch count. *)
}
val make : ?graderConfig:GraderConfig.t -> ?hyperParameters:RFTHyperParameters.t -> unit -> t
val to_value : t -> [> `Structure of (string * [> `Structure of (string * [> `Enum of string | `Float of RFTLearningRate.t | `Integer of EpochCount.t | `Structure of (string * [> `String of LambdaArn.t ]) list ]) list ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t