@aws-cdk/aws-glue-alpha
Version:
The CDK Construct Library for AWS::Glue
77 lines (76 loc) • 3.03 kB
TypeScript
import { Construct } from 'constructs';
import { Code } from '../code';
import { SparkJob, SparkJobProps } from './spark-job';
/**
* Properties for creating a Python Spark ETL job
*/
export interface PySparkEtlJobProps extends SparkJobProps {
/**
* Extra Python Files S3 URL (optional)
* S3 URL where additional python dependencies are located
*
* @default - no extra files
*/
readonly extraPythonFiles?: Code[];
/**
* Additional files, such as configuration files that AWS Glue copies to the working directory of your script before executing it.
*
* @default - no extra files specified.
*
* @see https://docs.aws.amazon.com/glue/latest/dg/aws-glue-programming-etl-glue-arguments.html
*/
readonly extraFiles?: Code[];
/**
* Extra Jars S3 URL (optional)
* S3 URL where additional jar dependencies are located
* @default - no extra jar files
*/
readonly extraJars?: Code[];
/**
* Setting this value to true prioritizes the customer's extra JAR files in the classpath.
*
* @default false - priority is not given to user-provided jars
*
* @see `--user-jars-first` in https://docs.aws.amazon.com/glue/latest/dg/aws-glue-programming-etl-glue-arguments.html
*/
readonly extraJarsFirst?: boolean;
/**
* Specifies whether job run queuing is enabled for the job runs for this job.
* A value of true means job run queuing is enabled for the job runs.
* If false or not populated, the job runs will not be considered for queueing.
* If this field does not match the value set in the job run, then the value from
* the job run field will be used. This property must be set to false for flex jobs.
* If this property is enabled, maxRetries must be set to zero.
*
* @default false
*/
readonly jobRunQueuingEnabled?: boolean;
}
/**
* PySpark ETL Jobs class
*
* ETL jobs support pySpark and Scala languages, for which there are separate
* but similar constructors. ETL jobs default to the G2 worker type, but you
* can override this default with other supported worker type values
* (G1, G2, G4 and G8). ETL jobs defaults to Glue version 4.0, which you can
* override to 3.0. The following ETL features are enabled by default:
* —enable-metrics, —enable-spark-ui, —enable-continuous-cloudwatch-log.
* You can find more details about version, worker type and other features
* in Glue's public documentation.
*/
export declare class PySparkEtlJob extends SparkJob {
/** Uniquely identifies this class. */
static readonly PROPERTY_INJECTION_ID: string;
readonly jobArn: string;
readonly jobName: string;
/**
* PySparkEtlJob constructor
*/
constructor(scope: Construct, id: string, props: PySparkEtlJobProps);
/**
* Set the executable arguments with best practices enabled by default
*
* @returns An array of arguments for Glue to use on execution
*/
private executableArguments;
}