-
Notifications
You must be signed in to change notification settings - Fork 2
/
emr.cluster.yml
45 lines (44 loc) · 1.32 KB
/
emr.cluster.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
---
# CloudFormation template declaring a single EMR cluster resource
# (EmrCluster) with Ganglia, Spark and Hadoop installed.
Description: "EMR cluster to run Apache Beam App in Spark."
Resources:
  EmrCluster:
    Type: "AWS::EMR::Cluster"
    Properties:
      Name: DataBeamEmr
      # Quoted so the release label is always read as a string.
      ReleaseLabel: "emr-5.20.0"
      Applications:
        - Name: Ganglia
        - Name: Spark
        - Name: Hadoop
      Configurations:
        - Classification: spark
          ConfigurationProperties:
            # Stays a quoted string: configuration properties are passed
            # through as string key/value pairs, not YAML booleans.
            maximizeResourceAllocation: "true"
      # Root EBS volume size; presumably GiB -- confirm against the
      # AWS::EMR::Cluster reference.
      EbsRootVolumeSize: 16
      Instances:
        # One on-demand master node.
        MasterInstanceGroup:
          Name: "Master Instance Group"
          InstanceType: "m4.large"
          InstanceCount: 1
          EbsConfiguration:
            EbsBlockDeviceConfigs:
              - VolumeSpecification:
                  SizeInGB: 32
                  VolumeType: gp2
          Market: "ON_DEMAND"
        # Two core nodes requested on the Spot market.
        CoreInstanceGroup:
          Name: "Core Instance Group"
          InstanceType: "r4.xlarge"
          InstanceCount: 2
          EbsConfiguration:
            EbsBlockDeviceConfigs:
              - VolumeSpecification:
                  SizeInGB: 32
                  VolumeType: gp2
          Market: "SPOT"
          # Spot bid for the core group; kept quoted because the property
          # is string-typed. Presumably USD per instance-hour -- confirm.
          BidPrice: "0.13"
      # NOTE(review): these look like the account-level default EMR roles;
      # this template does not create them, so they must already exist.
      JobFlowRole: EMR_EC2_DefaultRole
      ServiceRole: EMR_DefaultRole
      # Logging to S3 is disabled; uncomment and point at a real bucket
      # to enable it.
      # LogUri: "s3n://example-bucket/logs/"
      ScaleDownBehavior: "TERMINATE_AT_TASK_COMPLETION"
      VisibleToAllUsers: true