Author: swagle
Date: Tue May 14 20:21:34 2013
New Revision: 1482557

URL: http://svn.apache.org/r1482557
Log:
AMBARI-2116. Add parameters to improve HIVE performance. With descriptions. 
(swagle)

Modified:
    incubator/ambari/trunk/CHANGES.txt
    
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDP/1.3.0/services/HIVE/configuration/hive-site.xml
    
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDPLocal/1.3.0/services/HIVE/configuration/hive-site.xml

Modified: incubator/ambari/trunk/CHANGES.txt
URL: 
http://svn.apache.org/viewvc/incubator/ambari/trunk/CHANGES.txt?rev=1482557&r1=1482556&r2=1482557&view=diff
==============================================================================
--- incubator/ambari/trunk/CHANGES.txt (original)
+++ incubator/ambari/trunk/CHANGES.txt Tue May 14 20:21:34 2013
@@ -850,6 +850,9 @@ Trunk (unreleased changes):
 
  BUG FIXES
 
+ AMBARI-2116. Add parameters to improve HIVE performance. With descriptions. 
+ (swagle)
+
  AMBARI-2127. Service check should not emit log with Exceptions considering
  its a positive scenario. (smohanty)
 

Modified: 
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDP/1.3.0/services/HIVE/configuration/hive-site.xml
URL: 
http://svn.apache.org/viewvc/incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDP/1.3.0/services/HIVE/configuration/hive-site.xml?rev=1482557&r1=1482556&r2=1482557&view=diff
==============================================================================
--- 
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDP/1.3.0/services/HIVE/configuration/hive-site.xml
 (original)
+++ 
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDP/1.3.0/services/HIVE/configuration/hive-site.xml
 Tue May 14 20:21:34 2013
@@ -143,16 +143,19 @@ limitations under the License.
   <property>
     <name>hive.enforce.bucketing</name>
     <value>true</value>
+    <description>Whether bucketing is enforced. If true, while inserting into 
the table, bucketing is enforced.</description>
   </property>
 
   <property>
     <name>hive.enforce.sorting</name>
     <value>true</value>
+    <description>Whether sorting is enforced. If true, while inserting into 
the table, sorting is enforced.</description>
   </property>
 
   <property>
     <name>hive.map.aggr</name>
     <value>true</value>
+    <description>Whether to use map-side aggregation in Hive Group By 
queries.</description>
   </property>
 
   <property>
@@ -168,16 +171,22 @@ limitations under the License.
   <property>
     <name>hive.mapred.reduce.tasks.speculative.execution</name>
     <value>false</value>
+    <description>Whether speculative execution for reducers should be turned 
on.</description>
   </property>
 
   <property>
     <name>hive.auto.convert.join</name>
     <value>true</value>
+    <description>Whether Hive enables the optimization of converting a common
+      join into a mapjoin based on the input file size.</description>
   </property>
 
   <property>
     <name>hive.auto.convert.sortmerge.join</name>
     <value>true</value>
+    <description>Whether the join will be automatically converted to a sort-merge 
join if the joined tables pass
+      the criteria for a sort-merge join.
+    </description>
   </property>
 
   <property>
@@ -188,21 +197,38 @@ limitations under the License.
   <property>
     <name>hive.auto.convert.join.noconditionaltask</name>
     <value>true</value>
+    <description>Whether Hive enables the optimization of converting a common 
join into a mapjoin based on the input file
+      size. If this parameter is on, and the sum of the sizes of n-1 of the 
tables/partitions for an n-way join is smaller than the
+      specified size, the join is directly converted to a mapjoin (there is no 
conditional task).
+    </description>
   </property>
 
   <property>
     <name>hive.auto.convert.join.noconditionaltask.size</name>
     <value>1000000000</value>
+    <description>If hive.auto.convert.join.noconditionaltask is off, this 
parameter does not take effect. However, if it
+      is on, and the sum of the sizes of n-1 of the tables/partitions for an n-way 
join is smaller than this size, the join is directly
+      converted to a mapjoin (there is no conditional task). The default is 
10MB.
+    </description>
   </property>
 
   <property>
     <name>hive.optimize.reducededuplication.min.reducer</name>
     <value>1</value>
+    <description>Reduce deduplication merges two RSs by moving 
key/parts/reducer-num of the child RS to parent RS.
+      That means if reducer-num of the child RS is fixed (order by or forced 
bucketing) and small, it can result in a very slow, single MR job.
+      The optimization will be disabled if the number of reducers is less than the 
specified value.
+    </description>
   </property>
 
   <property>
     <name>hive.optimize.mapjoin.mapreduce</name>
     <value>true</value>
+    <description>If hive.auto.convert.join is off, this parameter does not take
+      effect. If it is on, and if there are map-join jobs followed by a 
map-reduce
+      job (e.g. a group by), each map-only job is merged with the following
+      map-reduce job.
+    </description>
   </property>
 
 </configuration>

Modified: 
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDPLocal/1.3.0/services/HIVE/configuration/hive-site.xml
URL: 
http://svn.apache.org/viewvc/incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDPLocal/1.3.0/services/HIVE/configuration/hive-site.xml?rev=1482557&r1=1482556&r2=1482557&view=diff
==============================================================================
--- 
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDPLocal/1.3.0/services/HIVE/configuration/hive-site.xml
 (original)
+++ 
incubator/ambari/trunk/ambari-server/src/main/resources/stacks/HDPLocal/1.3.0/services/HIVE/configuration/hive-site.xml
 Tue May 14 20:21:34 2013
@@ -143,16 +143,19 @@ limitations under the License.
   <property>
     <name>hive.enforce.bucketing</name>
     <value>true</value>
+    <description>Whether bucketing is enforced. If true, while inserting into 
the table, bucketing is enforced.</description>
   </property>
 
   <property>
     <name>hive.enforce.sorting</name>
     <value>true</value>
+    <description>Whether sorting is enforced. If true, while inserting into 
the table, sorting is enforced.</description>
   </property>
 
   <property>
     <name>hive.map.aggr</name>
     <value>true</value>
+    <description>Whether to use map-side aggregation in Hive Group By 
queries.</description>
   </property>
 
   <property>
@@ -168,16 +171,22 @@ limitations under the License.
   <property>
     <name>hive.mapred.reduce.tasks.speculative.execution</name>
     <value>false</value>
+    <description>Whether speculative execution for reducers should be turned 
on.</description>
   </property>
 
   <property>
     <name>hive.auto.convert.join</name>
     <value>true</value>
+    <description>Whether Hive enables the optimization of converting a common
+      join into a mapjoin based on the input file size.</description>
   </property>
 
   <property>
     <name>hive.auto.convert.sortmerge.join</name>
     <value>true</value>
+    <description>Whether the join will be automatically converted to a sort-merge 
join if the joined tables pass
+      the criteria for a sort-merge join.
+    </description>
   </property>
 
   <property>
@@ -188,21 +197,38 @@ limitations under the License.
   <property>
     <name>hive.auto.convert.join.noconditionaltask</name>
     <value>true</value>
+    <description>Whether Hive enables the optimization of converting a common 
join into a mapjoin based on the input file
+      size. If this parameter is on, and the sum of the sizes of n-1 of the 
tables/partitions for an n-way join is smaller than the
+      specified size, the join is directly converted to a mapjoin (there is no 
conditional task).
+    </description>
   </property>
 
   <property>
     <name>hive.auto.convert.join.noconditionaltask.size</name>
     <value>1000000000</value>
+    <description>If hive.auto.convert.join.noconditionaltask is off, this 
parameter does not take effect. However, if it
+      is on, and the sum of the sizes of n-1 of the tables/partitions for an n-way 
join is smaller than this size, the join is directly
+      converted to a mapjoin (there is no conditional task). The default is 
10MB.
+    </description>
   </property>
 
   <property>
     <name>hive.optimize.reducededuplication.min.reducer</name>
     <value>1</value>
+    <description>Reduce deduplication merges two RSs by moving 
key/parts/reducer-num of the child RS to parent RS.
+      That means if reducer-num of the child RS is fixed (order by or forced 
bucketing) and small, it can result in a very slow, single MR job.
+      The optimization will be disabled if the number of reducers is less than the 
specified value.
+    </description>
   </property>
 
   <property>
     <name>hive.optimize.mapjoin.mapreduce</name>
     <value>true</value>
+    <description>If hive.auto.convert.join is off, this parameter does not take
+      effect. If it is on, and if there are map-join jobs followed by a 
map-reduce
+      job (e.g. a group by), each map-only job is merged with the following
+      map-reduce job.
+    </description>
   </property>
 
 </configuration>


Reply via email to