Module Values.ParsingConfigurationSource

Settings for parsing document contents. By default, the service converts the contents of each document into text before splitting it into chunks. To improve processing of PDF files with tables and images, you can configure the data source to convert the pages of text into images and use a model to describe the contents of each page.

type nonrec t = {
  parsingStrategy : ParsingStrategy.t;
    (* The parsing strategy for the data source. *)
  bedrockFoundationModelConfiguration : BedrockFoundationModelConfigurationForParsing.t option;
    (* Settings for a foundation model used to parse documents for a data source. *)
}
val context_ : string
val make : ?bedrockFoundationModelConfiguration:BedrockFoundationModelConfigurationForParsing.t -> parsingStrategy:ParsingStrategy.t -> unit -> t
val to_value : t -> [> `Structure of (string * [> `Enum of string | `Structure of (string * [> `String of BedrockModelArnForParsing.t | `Structure of (string * [> `String of ParsingPromptText.t ]) list ]) list ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t