@aws-cdk/aws-glue-alpha
Version:
The CDK Construct Library for AWS::Glue
77 lines (76 loc) • 3.07 kB
TypeScript
import { Construct } from 'constructs';
import { Code } from '../code';
import { SparkJob, SparkJobProps } from './spark-job';
/**
* Properties for creating a Python Spark ETL job
*/
export interface PySparkStreamingJobProps extends SparkJobProps {
/**
* Extra Python Files S3 URL (optional)
* S3 URL where additional python dependencies are located
*
* @default - no extra files
*/
readonly extraPythonFiles?: Code[];
/**
* Additional files, such as configuration files that AWS Glue copies to the working directory of your script before executing it.
*
* @default - no extra files specified.
*
* @see https://docs.aws.amazon.com/glue/latest/dg/aws-glue-programming-etl-glue-arguments.html
*/
readonly extraFiles?: Code[];
/**
* Extra Jars S3 URL (optional)
* S3 URL where additional jar dependencies are located
* @default - no extra jar files
*/
readonly extraJars?: Code[];
/**
* Setting this value to true prioritizes the customer's extra JAR files in the classpath.
*
* @default false - priority is not given to user-provided jars
*
* @see `--user-jars-first` in https://docs.aws.amazon.com/glue/latest/dg/aws-glue-programming-etl-glue-arguments.html
*/
readonly extraJarsFirst?: boolean;
/**
* Specifies whether job run queuing is enabled for the job runs for this job.
* A value of true means job run queuing is enabled for the job runs.
* If false or not populated, the job runs will not be considered for queueing.
* If this field does not match the value set in the job run, then the value from
* the job run field will be used. This property must be set to false for flex jobs.
* If this property is enabled, maxRetries must be set to zero.
*
* @default - no job run queuing
*/
readonly jobRunQueuingEnabled?: boolean;
}
/**
* Python Spark Streaming Jobs class
*
* A Streaming job is similar to an ETL job, except that it performs ETL on data streams
* using the Apache Spark Structured Streaming framework.
* These jobs will default to use Python 3.9.
*
* Similar to ETL jobs, streaming job supports Scala and Python languages. Similar to ETL,
* it supports G1 and G2 worker type and 2.0, 3.0 and 4.0 version. We’ll default to G2 worker
* and 4.0 version for streaming jobs which developers can override.
* We will enable —enable-metrics, —enable-spark-ui, —enable-continuous-cloudwatch-log.
*/
export declare class PySparkStreamingJob extends SparkJob {
/** Uniquely identifies this class. */
static readonly PROPERTY_INJECTION_ID: string;
readonly jobArn: string;
readonly jobName: string;
/**
* PySparkStreamingJob constructor
*/
constructor(scope: Construct, id: string, props: PySparkStreamingJobProps);
/**
* Set the executable arguments with best practices enabled by default
*
* @returns An array of arguments for Glue to use on execution
*/
private executableArguments;
}