UNPKG

@aws-cdk/aws-glue-alpha

Version:

The CDK Construct Library for AWS::Glue

77 lines (76 loc) 3.03 kB
import { Construct } from 'constructs'; import { Code } from '../code'; import { SparkJob, SparkJobProps } from './spark-job'; /** * Properties for creating a Python Spark ETL job */ export interface PySparkEtlJobProps extends SparkJobProps { /** * Extra Python Files S3 URL (optional) * S3 URL where additional python dependencies are located * * @default - no extra files */ readonly extraPythonFiles?: Code[]; /** * Additional files, such as configuration files that AWS Glue copies to the working directory of your script before executing it. * * @default - no extra files specified. * * @see https://docs.aws.amazon.com/glue/latest/dg/aws-glue-programming-etl-glue-arguments.html */ readonly extraFiles?: Code[]; /** * Extra Jars S3 URL (optional) * S3 URL where additional jar dependencies are located * @default - no extra jar files */ readonly extraJars?: Code[]; /** * Setting this value to true prioritizes the customer's extra JAR files in the classpath. * * @default false - priority is not given to user-provided jars * * @see `--user-jars-first` in https://docs.aws.amazon.com/glue/latest/dg/aws-glue-programming-etl-glue-arguments.html */ readonly extraJarsFirst?: boolean; /** * Specifies whether job run queuing is enabled for the job runs for this job. * A value of true means job run queuing is enabled for the job runs. * If false or not populated, the job runs will not be considered for queueing. * If this field does not match the value set in the job run, then the value from * the job run field will be used. This property must be set to false for flex jobs. * If this property is enabled, maxRetries must be set to zero. * * @default false */ readonly jobRunQueuingEnabled?: boolean; } /** * PySpark ETL Jobs class * * ETL jobs support pySpark and Scala languages, for which there are separate * but similar constructors. ETL jobs default to the G2 worker type, but you * can override this default with other supported worker type values * (G1, G2, G4 and G8). ETL jobs defaults to Glue version 4.0, which you can * override to 3.0. The following ETL features are enabled by default: * —enable-metrics, —enable-spark-ui, —enable-continuous-cloudwatch-log. * You can find more details about version, worker type and other features * in Glue's public documentation. */ export declare class PySparkEtlJob extends SparkJob { /** Uniquely identifies this class. */ static readonly PROPERTY_INJECTION_ID: string; readonly jobArn: string; readonly jobName: string; /** * PySparkEtlJob constructor */ constructor(scope: Construct, id: string, props: PySparkEtlJobProps); /** * Set the executable arguments with best practices enabled by default * * @returns An array of arguments for Glue to use on execution */ private executableArguments; }