CreateClusterAndSubmitSteps
CreateClusterAndSubmitSteps
yaml
type: "io.kestra.plugin.aws.emr.CreateClusterAndSubmitSteps"
Examples
yaml
# Example flow: create an EMR cluster and submit a single Spark step to it.
id: aws_emr_create_cluster
namespace: company.team

tasks:
  - id: create_cluster
    type: io.kestra.plugin.aws.emr.CreateClusterAndSubmitSteps
    # Credentials are resolved from secrets at runtime rather than hard-coded.
    accessKeyId: "{{ secret('AWS_ACCESS_KEY_ID') }}"
    secretKeyId: "{{ secret('AWS_SECRET_KEY_ID') }}"
    region: eu-west-3
    clusterName: "Spark job cluster"
    logUri: "s3://my-bucket/test-emr-logs"
    # Overrides the documented default (false).
    keepJobFlowAliveWhenNoSteps: true
    applications:
      - Spark
    masterInstanceType: m5.xlarge
    slaveInstanceType: m5.xlarge
    instanceCount: 3
    ec2KeyName: my-ec2-ssh-key-pair-name
    # Each entry is a StepConfig: name, jar and actionOnFailure are required.
    steps:
      - name: Spark_job_test
        jar: "command-runner.jar"
        actionOnFailure: CONTINUE
        commands:
          # Folded scalar: the lines below are joined with single spaces into
          # one command string, with no trailing newline.
          - >-
            spark-submit s3://mybucket/health_violations.py
            --data_source s3://mybucket/food_establishment_data.csv
            --output_uri s3://mybucket/test-emr-output
    # Task-level property (not part of the step); overrides the documented
    # default (false). Presumably makes the task block until completion --
    # confirm against the plugin documentation.
    wait: true
Properties
clusterName *Required string
instanceCount *Required integer | string
masterInstanceType *Required string
slaveInstanceType *Required string
accessKeyId string
applications array
SubType string
compatibilityMode boolean | string
completionCheckInterval string
Default
PT10S
Format
duration
ec2KeyName string
ec2SubnetId string
endpointOverride string
forcePathStyle boolean | string
jobFlowRole string
Default
EMR_EC2_DefaultRole
keepJobFlowAliveWhenNoSteps boolean | string
Default
false
logUri string
region string
releaseLabel string
Default
emr-5.20.0
secretKeyId string
serviceRole string
Default
EMR_DefaultRole
sessionToken string
steps Non-dynamic array
Definitions
io.kestra.plugin.aws.emr.models.StepConfig
actionOnFailure *Required string
Possible Values
TERMINATE_CLUSTER, CANCEL_AND_WAIT, CONTINUE, TERMINATE_JOB_FLOW
jar *Required string
name *Required string
commands array
SubType string
mainClass string
stsEndpointOverride string
stsRoleArn string
stsRoleExternalId string
stsRoleSessionDuration string
Default
PT15M
Format
duration
stsRoleSessionName string
visibleToAllUsers boolean | string
Default
true
wait boolean | string
Default
false
waitUntilCompletion string
Default
PT1H
Format
duration