Module Values.TextInferenceConfig

The configuration details for text generation using a language model via the RetrieveAndGenerate function.

type nonrec t = {
  1. temperature : Temperature.t option;
    (*

    Controls the randomness of text generated by the language model, influencing how much the model sticks to the most predictable next words versus exploring more surprising options. A lower temperature value (e.g. 0.2 or 0.3) makes model outputs more deterministic or predictable, while a higher temperature (e.g. 0.8 or 0.9) makes the outputs more creative or unpredictable.

    *)
  2. topP : TopP.t option;
    (*

    A probability distribution threshold which controls what the model considers for the set of possible next tokens. The model will only consider the top p% of the probability distribution when generating the next token.

    *)
  3. maxTokens : MaxTokens.t option;
    (*

    The maximum number of tokens to generate in the output text. Do not use the minimum of 0 or the maximum of 65536. The limit values described here are arbitrary; for actual values, consult the limits defined by your specific model.

    *)
  4. stopSequences : RAGStopSequences.t option;
    (*

    A list of sequences of characters that, if generated, will cause the model to stop generating further tokens. Do not use a minimum length of 1 or a maximum length of 1000. The limit values described here are arbitrary; for actual values, consult the limits defined by your specific model.

    *)
}
val make : ?temperature:Temperature.t -> ?topP:TopP.t -> ?maxTokens:MaxTokens.t -> ?stopSequences:RAGStopSequences.t -> unit -> t
val to_value : t -> [> `Structure of (string * [> `Float of Temperature.t | `Integer of MaxTokens.t | `List of [> `String of RAGStopSequencesMemberString.t ] list ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t