Ottomata has submitted this change and it was merged. Change subject: Moving compression configs to mapred-site.xml where they belong ......................................................................
Moving compression configs to mapred-site.xml where they belong Change-Id: I4adbf4ca20a194f9beaa8a7fb407c151e6809a0f --- M manifests/hadoop.pp M manifests/hadoop/defaults.pp M templates/hadoop/mapred-site.xml.erb M templates/hadoop/yarn-site.xml.erb 4 files changed, 36 insertions(+), 36 deletions(-) Approvals: Ottomata: Verified; Looks good to me, approved jenkins-bot: Verified diff --git a/manifests/hadoop.pp b/manifests/hadoop.pp index 57f26ed..49562a0 100644 --- a/manifests/hadoop.pp +++ b/manifests/hadoop.pp @@ -21,8 +21,6 @@ # $yarn_local_path - path relative to JBOD mount point for yarn local directories. # $yarn_logs_path - path relative to JBOD mount point for yarn log directories. # $dfs_block_size - HDFS block size in bytes. Default 64MB. -# $enable_intermediate_compression - If true, intermediate MapReduce data will be compressed with Snappy. -# $enable_final_compession - If true, Final output of MapReduce jobs will be compressed with Snappy. # $io_file_buffer_size # $map_tasks_maximum # $reduce_tasks_maximum @@ -34,6 +32,8 @@ # $mapreduce_task_io_sort_factor # $mapreduce_map_java_opts # $mapreduce_child_java_opts +# $mapreduce_intermediate_compression - If true, intermediate MapReduce data will be compressed with Snappy. Default: true. +# $mapreduce_final_compession - If true, final output of MapReduce jobs will be compressed with Snappy. Default: false. # $yarn_nodemanager_resource_memory_mb # $yarn_resourcemanager_scheduler_class - If you change this (e.g. to FairScheduler), you should also provide your own scheduler config .xml files outside of the cdh4 module. 
# $use_yarn @@ -49,8 +49,6 @@ $dfs_block_size = $::cdh4::hadoop::defaults::dfs_block_size, $enable_jmxremote = $::cdh4::hadoop::defaults::enable_jmxremote, $enable_webhdfs = $::cdh4::hadoop::defaults::enable_webhdfs, - $enable_intermediate_compression = $::cdh4::hadoop::defaults::enable_intermediate_compression, - $enable_final_compession = $::cdh4::hadoop::defaults::enable_final_compession, $io_file_buffer_size = $::cdh4::hadoop::defaults::io_file_buffer_size, $mapreduce_map_tasks_maximum = $::cdh4::hadoop::defaults::mapreduce_map_tasks_maximum, $mapreduce_reduce_tasks_maximum = $::cdh4::hadoop::defaults::mapreduce_reduce_tasks_maximum, @@ -62,6 +60,8 @@ $mapreduce_task_io_sort_factor = $::cdh4::hadoop::defaults::mapreduce_task_io_sort_factor, $mapreduce_map_java_opts = $::cdh4::hadoop::defaults::mapreduce_map_java_opts, $mapreduce_reduce_java_opts = $::cdh4::hadoop::defaults::mapreduce_reduce_java_opts, + $mapreduce_intermediate_compression = $::cdh4::hadoop::defaults::mapreduce_intermediate_compression, + $mapreduce_final_compession = $::cdh4::hadoop::defaults::mapreduce_final_compession, $yarn_nodemanager_resource_memory_mb = $::cdh4::hadoop::defaults::yarn_nodemanager_resource_memory_mb, $yarn_resourcemanager_scheduler_class = $::cdh4::hadoop::defaults::yarn_resourcemanager_scheduler_class, $use_yarn = $::cdh4::hadoop::defaults::use_yarn diff --git a/manifests/hadoop/defaults.pp b/manifests/hadoop/defaults.pp index 5ad57aa..3fc6c5d 100644 --- a/manifests/hadoop/defaults.pp +++ b/manifests/hadoop/defaults.pp @@ -10,8 +10,6 @@ $dfs_block_size = 67108864 # 64MB default $enable_jmxremote = true $enable_webhdfs = true - $enable_intermediate_compression = true - $enable_final_compession = false $io_file_buffer_size = undef $mapreduce_map_tasks_maximum = undef $mapreduce_reduce_tasks_maximum = undef @@ -23,6 +21,8 @@ $mapreduce_task_io_sort_factor = undef $mapreduce_map_java_opts = undef $mapreduce_reduce_java_opts = undef + $mapreduce_intermediate_compression = true 
+ $mapreduce_final_compression = false $yarn_nodemanager_resource_memory_mb = undef $yarn_resourcemanager_scheduler_class = undef $use_yarn = true diff --git a/templates/hadoop/mapred-site.xml.erb b/templates/hadoop/mapred-site.xml.erb index 137c43a..8864b15 100644 --- a/templates/hadoop/mapred-site.xml.erb +++ b/templates/hadoop/mapred-site.xml.erb @@ -31,7 +31,7 @@ <name>mapreduce.jobhistory.done-dir</name> <value>/user/history/done</value> </property> - + <property> <name>mapred.job.tracker</name> <!-- Hue gets confused if mapred.job.tracker is not set, @@ -115,6 +115,30 @@ </property> <% end -%> + <!-- MapReduce intermediate compression --> + <property> + <name>mapreduce.map.output.compress</name> + <value><%= mapreduce_intermediate_compression %></value> + </property> + <property> + <name>mapreduce.map.output.compress.codec</name> + <value>org.apache.hadoop.io.compress.SnappyCodec</value> + </property> + + <!-- MapReduce final output compression --> + <property> + <name>mapreduce.output.fileoutputformat.compress</name> + <value><%= mapreduce_final_compression %></value> + </property> + <property> + <name>mapred.output.fileoutputformat.compress.codec</name> + <value>org.apache.hadoop.io.compress.SnappyCodec</value> + </property> + <property> + <name>mapreduce.output.fileoutputformat.compress.type</name> + <value>BLOCK</value> + </property> + <property> <name>mapred.hosts.exclude</name> <value><%= config_directory %>/hosts.exclude</value> diff --git a/templates/hadoop/yarn-site.xml.erb b/templates/hadoop/yarn-site.xml.erb index c11b8f2..3d51195 100644 --- a/templates/hadoop/yarn-site.xml.erb +++ b/templates/hadoop/yarn-site.xml.erb @@ -58,10 +58,6 @@ <value>org.apache.hadoop.mapred.ShuffleHandler</value> </property> - <property> - <name>yarn.log-aggregation-enable</name> - <value>true</value> - </property> <% if @datanode_mounts -%> <property> @@ -85,6 +81,11 @@ <% end -%> <property> + <name>yarn.log-aggregation-enable</name> + <value>true</value> + </property> 
+ + <property> <description>Where to aggregate logs to.</description> <name>yarn.nodemanager.remote-app-log-dir</name> <value>/var/log/hadoop-yarn/apps</value> @@ -96,17 +97,6 @@ <value>/user</value> </property> - - <!-- MapReduce intermediate compression --> - <property> - <name>mapreduce.map.output.compress</name> - <value><%= enable_intermediate_compression %></value> - </property> - <property> - <name>mapreduce.map.output.compress.codec</name> - <value>org.apache.hadoop.io.compress.SnappyCodec</value> - </property> - <property> <name>yarn.resourcemanager.nodes.exclude-path</name> <value><%= config_directory %>/hosts.exclude</value> @@ -115,20 +105,6 @@ This is useful for decommissioning nodes. </description> </property> - - <!-- MapReduce final output compression --> - <property> - <name>mapreduce.output.fileoutputformat.compress</name> - <value><%= enable_final_compession %></value> - </property> - <property> - <name>mapred.output.fileoutputformat.compress.codec</name> - <value>org.apache.hadoop.io.compress.SnappyCodec</value> - </property> - <property> - <name>mapreduce.output.fileoutputformat.compress.type</name> - <value>BLOCK</value> - </property> <property> <description>Classpath for typical applications.</description> -- To view, visit https://gerrit.wikimedia.org/r/66869 To unsubscribe, visit https://gerrit.wikimedia.org/r/settings Gerrit-MessageType: merged Gerrit-Change-Id: I4adbf4ca20a194f9beaa8a7fb407c151e6809a0f Gerrit-PatchSet: 2 Gerrit-Project: operations/puppet/cdh4 Gerrit-Branch: master Gerrit-Owner: Ottomata <o...@wikimedia.org> Gerrit-Reviewer: Ottomata <o...@wikimedia.org> Gerrit-Reviewer: jenkins-bot _______________________________________________ MediaWiki-commits mailing list MediaWiki-commits@lists.wikimedia.org https://lists.wikimedia.org/mailman/listinfo/mediawiki-commits