Menu
Amazon EMR
Developer Guide

Hadoop Configuration (Hadoop 1.0.3)

The following Amazon EMR default configuration settings for clusters launched with Amazon EMR AMI 2.3 are appropriate for most workloads.

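If your cluster tasks are memory-intensive, you can enhance performance by using fewer tasks per core node (lower the mapred.tasktracker.map.tasks.maximum and mapred.tasktracker.reduce.tasks.maximum values) and reducing your job tracker heap size (HADOOP_JOBTRACKER_HEAPSIZE).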

The following tables list the default configuration settings for each EC2 instance type in clusters launched with the Amazon EMR AMI version 2.3. Heap size values (the HADOOP_*_HEAPSIZE parameters) are specified in megabytes. For more information about the AMI versions supported by Amazon EMR, see Choose an Amazon Machine Image (AMI).

m1.small

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 576
HADOOP_NAMENODE_HEAPSIZE 192
HADOOP_TASKTRACKER_HEAPSIZE 192
HADOOP_DATANODE_HEAPSIZE 96
mapred.child.java.opts -Xmx288m
mapred.tasktracker.map.tasks.maximum 2
mapred.tasktracker.reduce.tasks.maximum 1

m1.medium

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 1152
HADOOP_NAMENODE_HEAPSIZE 384
HADOOP_TASKTRACKER_HEAPSIZE 192
HADOOP_DATANODE_HEAPSIZE 192
mapred.child.java.opts -Xmx576m
mapred.tasktracker.map.tasks.maximum 2
mapred.tasktracker.reduce.tasks.maximum 1

m1.large

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 2304
HADOOP_NAMENODE_HEAPSIZE 768
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx864m
mapred.tasktracker.map.tasks.maximum 3
mapred.tasktracker.reduce.tasks.maximum 1

m1.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6912
HADOOP_NAMENODE_HEAPSIZE 2304
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx768m
mapred.tasktracker.map.tasks.maximum 8
mapred.tasktracker.reduce.tasks.maximum 3

m2.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 9216
HADOOP_NAMENODE_HEAPSIZE 3072
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx2304m
mapred.tasktracker.map.tasks.maximum 3
mapred.tasktracker.reduce.tasks.maximum 1

m2.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 18432
HADOOP_NAMENODE_HEAPSIZE 6144
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx2688m
mapred.tasktracker.map.tasks.maximum 6
mapred.tasktracker.reduce.tasks.maximum 2

m2.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 36864
HADOOP_NAMENODE_HEAPSIZE 12288
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx2304m
mapred.tasktracker.map.tasks.maximum 14
mapred.tasktracker.reduce.tasks.maximum 4

m3.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 3686
HADOOP_NAMENODE_HEAPSIZE 1740
HADOOP_TASKTRACKER_HEAPSIZE 686
HADOOP_DATANODE_HEAPSIZE 757
mapred.child.java.opts -Xmx1440m
mapred.tasktracker.map.tasks.maximum 6
mapred.tasktracker.reduce.tasks.maximum 2

m3.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6758
HADOOP_NAMENODE_HEAPSIZE 3276
HADOOP_TASKTRACKER_HEAPSIZE 839
HADOOP_DATANODE_HEAPSIZE 1064
mapred.child.java.opts -Xmx1440m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 4

c1.medium

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 576
HADOOP_NAMENODE_HEAPSIZE 192
HADOOP_TASKTRACKER_HEAPSIZE 192
HADOOP_DATANODE_HEAPSIZE 96
mapred.child.java.opts -Xmx288m
mapred.tasktracker.map.tasks.maximum 2
mapred.tasktracker.reduce.tasks.maximum 1

c1.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 2304
HADOOP_NAMENODE_HEAPSIZE 768
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx384m
mapred.tasktracker.map.tasks.maximum 7
mapred.tasktracker.reduce.tasks.maximum 2

c3.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 2124
HADOOP_NAMENODE_HEAPSIZE 972
HADOOP_TASKTRACKER_HEAPSIZE 588
HADOOP_DATANODE_HEAPSIZE 588
mapred.child.java.opts -Xmx1408m
mapred.tasktracker.map.tasks.maximum 3
mapred.tasktracker.reduce.tasks.maximum 1

c3.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 3686
HADOOP_NAMENODE_HEAPSIZE 1740
HADOOP_TASKTRACKER_HEAPSIZE 686
HADOOP_DATANODE_HEAPSIZE 757
mapred.child.java.opts -Xmx1440m
mapred.tasktracker.map.tasks.maximum 6
mapred.tasktracker.reduce.tasks.maximum 2

c3.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6758
HADOOP_NAMENODE_HEAPSIZE 3276
HADOOP_TASKTRACKER_HEAPSIZE 839
HADOOP_DATANODE_HEAPSIZE 1064
mapred.child.java.opts -Xmx1440m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 4

c3.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 12902
HADOOP_NAMENODE_HEAPSIZE 6348
HADOOP_TASKTRACKER_HEAPSIZE 1146
HADOOP_DATANODE_HEAPSIZE 1679
mapred.child.java.opts -Xmx1664m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 8

cc2.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 30114
HADOOP_NAMENODE_HEAPSIZE 12288
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx1536m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 6

cg1.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 7680
HADOOP_NAMENODE_HEAPSIZE 3840
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx864m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 3

cr1.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 50585
HADOOP_NAMENODE_HEAPSIZE 25190
HADOOP_TASKTRACKER_HEAPSIZE 2048
HADOOP_DATANODE_HEAPSIZE 4096
mapred.child.java.opts -Xmx7552m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 8

hi1.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 30114
HADOOP_NAMENODE_HEAPSIZE 12288
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx1536m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 6

hs1.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 30114
HADOOP_NAMENODE_HEAPSIZE 12288
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx1536m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 6

cg1.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 7680
HADOOP_NAMENODE_HEAPSIZE 3840
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx864m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 3

d2.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6860
HADOOP_NAMENODE_HEAPSIZE 3328
HADOOP_TASKTRACKER_HEAPSIZE 844
HADOOP_DATANODE_HEAPSIZE 1075
mapred.child.java.opts -Xmx2928m
mapred.tasktracker.map.tasks.maximum 6
mapred.tasktracker.reduce.tasks.maximum 2

d2.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 13107
HADOOP_NAMENODE_HEAPSIZE 6451
HADOOP_TASKTRACKER_HEAPSIZE 1157
HADOOP_DATANODE_HEAPSIZE 1699
mapred.child.java.opts -Xmx3392m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 4

d2.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 25600
HADOOP_NAMENODE_HEAPSIZE 12697
HADOOP_TASKTRACKER_HEAPSIZE 1781
HADOOP_DATANODE_HEAPSIZE 2949
mapred.child.java.opts -Xmx3648m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 8

d2.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 50585
HADOOP_NAMENODE_HEAPSIZE 25190
HADOOP_TASKTRACKER_HEAPSIZE 2048
HADOOP_DATANODE_HEAPSIZE 4096
mapred.child.java.opts -Xmx3356m
mapred.tasktracker.map.tasks.maximum 54
mapred.tasktracker.reduce.tasks.maximum 18

g2.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6912
HADOOP_NAMENODE_HEAPSIZE 2304
HADOOP_TASKTRACKER_HEAPSIZE 384
HADOOP_DATANODE_HEAPSIZE 384
mapred.child.java.opts -Xmx768m
mapred.tasktracker.map.tasks.maximum 8
mapred.tasktracker.reduce.tasks.maximum 3

i2.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6860
HADOOP_NAMENODE_HEAPSIZE 3328
HADOOP_TASKTRACKER_HEAPSIZE 844
HADOOP_DATANODE_HEAPSIZE 1075
mapred.child.java.opts -Xmx2928m
mapred.tasktracker.map.tasks.maximum 6
mapred.tasktracker.reduce.tasks.maximum 2

i2.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 13107
HADOOP_NAMENODE_HEAPSIZE 6451
HADOOP_TASKTRACKER_HEAPSIZE 1157
HADOOP_DATANODE_HEAPSIZE 1699
mapred.child.java.opts -Xmx3392m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 4

i2.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 25600
HADOOP_NAMENODE_HEAPSIZE 12697
HADOOP_TASKTRACKER_HEAPSIZE 1781
HADOOP_DATANODE_HEAPSIZE 2949
mapred.child.java.opts -Xmx3648m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 8

i2.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 50585
HADOOP_NAMENODE_HEAPSIZE 25190
HADOOP_TASKTRACKER_HEAPSIZE 2048
HADOOP_DATANODE_HEAPSIZE 4096
mapred.child.java.opts -Xmx3776m
mapred.tasktracker.map.tasks.maximum 48
mapred.tasktracker.reduce.tasks.maximum 16

r3.xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 6860
HADOOP_NAMENODE_HEAPSIZE 3328
HADOOP_TASKTRACKER_HEAPSIZE 844
HADOOP_DATANODE_HEAPSIZE 1075
mapred.child.java.opts -Xmx2928m
mapred.tasktracker.map.tasks.maximum 6
mapred.tasktracker.reduce.tasks.maximum 2

r3.2xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 13107
HADOOP_NAMENODE_HEAPSIZE 6451
HADOOP_TASKTRACKER_HEAPSIZE 1157
HADOOP_DATANODE_HEAPSIZE 1699
mapred.child.java.opts -Xmx3392m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 4

r3.4xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 25600
HADOOP_NAMENODE_HEAPSIZE 12697
HADOOP_TASKTRACKER_HEAPSIZE 1781
HADOOP_DATANODE_HEAPSIZE 2949
mapred.child.java.opts -Xmx7296m
mapred.tasktracker.map.tasks.maximum 12
mapred.tasktracker.reduce.tasks.maximum 4

r3.8xlarge

Parameter Value
HADOOP_JOBTRACKER_HEAPSIZE 50585
HADOOP_NAMENODE_HEAPSIZE 25190
HADOOP_TASKTRACKER_HEAPSIZE 2048
HADOOP_DATANODE_HEAPSIZE 4096
mapred.child.java.opts -Xmx7552m
mapred.tasktracker.map.tasks.maximum 24
mapred.tasktracker.reduce.tasks.maximum 8