Module Values_0.Crawler

Specifies a crawler program that examines a data source and uses classifiers to try to determine its schema. If successful, the crawler records metadata concerning the data source in the Glue Data Catalog.

type nonrec t = {
  1. name : NameString.t option;
    (*

    The name of the crawler.

    *)
  2. role : Role.t option;
    (*

    The Amazon Resource Name (ARN) of an IAM role that's used to access customer resources, such as Amazon Simple Storage Service (Amazon S3) data.

    *)
  3. targets : CrawlerTargets.t option;
    (*

    A collection of targets to crawl.

    *)
  4. databaseName : DatabaseName.t option;
    (*

    The name of the database in which the crawler's output is stored.

    *)
  5. description : DescriptionString.t option;
    (*

    A description of the crawler.

    *)
  6. classifiers : ClassifierNameList.t option;
    (*

    A list of UTF-8 strings that specify the custom classifiers that are associated with the crawler.

    *)
  7. recrawlPolicy : RecrawlPolicy.t option;
    (*

    A policy that specifies whether to crawl the entire dataset again, or to crawl only folders that were added since the last crawler run.

    *)
  8. schemaChangePolicy : SchemaChangePolicy.t option;
    (*

    The policy that specifies update and delete behaviors for the crawler.

    *)
  9. lineageConfiguration : LineageConfiguration.t option;
    (*

    A configuration that specifies whether data lineage is enabled for the crawler.

    *)
  10. state : CrawlerState.t option;
    (*

    Indicates whether the crawler is running, or whether a run is pending.

    *)
  11. tablePrefix : TablePrefix.t option;
    (*

    The prefix added to the names of tables that are created.

    *)
  12. schedule : Schedule.t option;
    (*

    For scheduled crawlers, the schedule when the crawler runs.

    *)
  13. crawlElapsedTime : MillisecondsCount.t option;
    (*

    If the crawler is running, contains the total time elapsed since the last crawl began.

    *)
  14. creationTime : Timestamp.t option;
    (*

    The time that the crawler was created.

    *)
  15. lastUpdated : Timestamp.t option;
    (*

    The time that the crawler was last updated.

    *)
  16. lastCrawl : LastCrawlInfo.t option;
    (*

    The status of the last crawl, and potentially error information if an error occurred.

    *)
  17. version : VersionId.t option;
    (*

    The version of the crawler.

    *)
  18. configuration : CrawlerConfiguration.t option;
    (*

    Crawler configuration information. This versioned JSON string allows users to specify aspects of a crawler's behavior. For more information, see "Setting crawler configuration options".

    *)
  19. crawlerSecurityConfiguration : CrawlerSecurityConfiguration.t option;
    (*

    The name of the SecurityConfiguration structure to be used by this crawler.

    *)
  20. lakeFormationConfiguration : LakeFormationConfiguration.t option;
    (*

    Specifies whether the crawler should use Lake Formation credentials instead of the IAM role credentials.

    *)
}
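val make : ?name:NameString.t -> ?role:Role.t -> ?targets:CrawlerTargets.t -> ?databaseName:DatabaseName.t -> ?description:DescriptionString.t -> ?classifiers:ClassifierNameList.t -> ?recrawlPolicy:RecrawlPolicy.t -> ?schemaChangePolicy:SchemaChangePolicy.t -> ?lineageConfiguration:LineageConfiguration.t -> ?state:CrawlerState.t -> ?tablePrefix:TablePrefix.t -> ?schedule:Schedule.t -> ?crawlElapsedTime:MillisecondsCount.t -> ?creationTime:Timestamp.t -> ?lastUpdated:Timestamp.t -> ?lastCrawl:LastCrawlInfo.t -> ?version:VersionId.t -> ?configuration:CrawlerConfiguration.t -> ?crawlerSecurityConfiguration:CrawlerSecurityConfiguration.t -> ?lakeFormationConfiguration:LakeFormationConfiguration.t -> unit -> t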
val to_value : t -> [> `Structure of (string * [> `Enum of string | `List of [> `String of NameString.t ] list | `Long of MillisecondsCount.t | `String of NameString.t | `Structure of (string * [> `Boolean of NullableBoolean.t | `Enum of string | `List of [> `Structure of (string * [> `Boolean of NullableBoolean.t | `Double of NullableDouble.t | `Integer of NullableInteger.t | `List of [> `Enum of string | `String of Path.t ] list | `String of Path.t ]) list ] list | `String of CronExpression.t | `Timestamp of Timestamp.t ]) list | `Timestamp of Timestamp.t ]) list ]
val to_query : t -> Awso.Client.Query.t
val of_xml : Awso.Xml.t -> t
val of_string : string -> t
val of_json : Yojson.Safe.t -> t
val to_json : t -> Yojson.Safe.t