Module Values.SemanticChunkingConfiguration

Settings for semantic document chunking for a data source. Semantic chunking splits a document into smaller documents based on groups of similar content derived from the text with natural language processing.

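type nonrec t = {
  maxTokens : SemanticChunkingConfigurationMaxTokensInteger.t;
    (*

    The maximum number of tokens that a chunk can contain.

    *)
  bufferSize : SemanticChunkingConfigurationBufferSizeInteger.t;
    (*

    The buffer size: the number of surrounding sentences that are grouped with each sentence when its content is compared for similarity. For example, a buffer size of 1 combines the previous, current, and next sentence.

    *)
  breakpointPercentileThreshold : SemanticChunkingConfigurationBreakpointPercentileThresholdInteger.t;
    (*

    The dissimilarity threshold for splitting chunks, expressed as a percentile. A chunk boundary is placed where the dissimilarity between adjacent groups of sentences exceeds this percentile.

    *)
}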
val context_ : string
val to_value : t -> [> `Structure of (string * [> `Integer of SemanticChunkingConfigurationMaxTokensInteger.t ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t