Repository: hive Updated Branches: refs/heads/master 419593e70 -> 32b899448
HIVE-18528: Stats: In the bitvector codepath, when extrapolating column stats for String type column, StringColumnStatsAggregator uses the min value instead of max (Vaibhav Gumashta reviewed by Ashutosh Chauhan) Project: http://git-wip-us.apache.org/repos/asf/hive/repo Commit: http://git-wip-us.apache.org/repos/asf/hive/commit/32b89944 Tree: http://git-wip-us.apache.org/repos/asf/hive/tree/32b89944 Diff: http://git-wip-us.apache.org/repos/asf/hive/diff/32b89944 Branch: refs/heads/master Commit: 32b8994480ec94cb1f28ba9cd295cd85cc7fe064 Parents: 419593e Author: Vaibhav Gumashta <vgumas...@hortonworks.com> Authored: Thu Feb 1 11:47:57 2018 -0800 Committer: Vaibhav Gumashta <vgumas...@hortonworks.com> Committed: Thu Feb 1 11:47:57 2018 -0800 ---------------------------------------------------------------------- .../metastore/columnstats/aggr/StringColumnStatsAggregator.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/hive/blob/32b89944/standalone-metastore/src/main/java/org/apache/hadoop/hive/metastore/columnstats/aggr/StringColumnStatsAggregator.java ---------------------------------------------------------------------- diff --git a/standalone-metastore/src/main/java/org/apache/hadoop/hive/metastore/columnstats/aggr/StringColumnStatsAggregator.java b/standalone-metastore/src/main/java/org/apache/hadoop/hive/metastore/columnstats/aggr/StringColumnStatsAggregator.java index 2b8c493..9537647 100644 --- a/standalone-metastore/src/main/java/org/apache/hadoop/hive/metastore/columnstats/aggr/StringColumnStatsAggregator.java +++ b/standalone-metastore/src/main/java/org/apache/hadoop/hive/metastore/columnstats/aggr/StringColumnStatsAggregator.java @@ -178,7 +178,7 @@ public class StringColumnStatsAggregator extends ColumnStatsAggregator implement if (aggregateData == null) { aggregateData = newData.deepCopy(); } else { - 
aggregateData.setAvgColLen(Math.min(aggregateData.getAvgColLen(), + aggregateData.setAvgColLen(Math.max(aggregateData.getAvgColLen(), newData.getAvgColLen())); aggregateData.setMaxColLen(Math.max(aggregateData.getMaxColLen(), newData.getMaxColLen()));