This is an automated email from the ASF dual-hosted git repository.
lijibing pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/doris.git
The following commit(s) were added to refs/heads/master by this push:
new 7ae2917b895 Fix failed p2 hive statistics case. (#34663)
7ae2917b895 is described below
commit 7ae2917b89544d581ae900b17b7fbaf380d22104
Author: Jibing-Li <[email protected]>
AuthorDate: Sat May 11 14:05:22 2024 +0800
Fix failed p2 hive statistics case. (#34663)
---
.../hive/test_hive_partition_column_analyze.groovy | 390 +++++++++++----------
.../hive/test_hive_partition_statistic.groovy | 3 +
2 files changed, 200 insertions(+), 193 deletions(-)
diff --git
a/regression-test/suites/external_table_p2/hive/test_hive_partition_column_analyze.groovy
b/regression-test/suites/external_table_p2/hive/test_hive_partition_column_analyze.groovy
index 336e2e8b784..d4b1fa3eca4 100644
---
a/regression-test/suites/external_table_p2/hive/test_hive_partition_column_analyze.groovy
+++
b/regression-test/suites/external_table_p2/hive/test_hive_partition_column_analyze.groovy
@@ -31,199 +31,203 @@ suite("test_hive_partition_column_analyze",
"p2,external,hive,external_remote,ex
"""
logger.info("catalog " + catalog_name + " created")
- // Test analyze table without init.
- sql """analyze table
${catalog_name}.multi_partition.multi_partition_parquet (event_day) with sync"""
- sql """analyze table
${catalog_name}.multi_partition.multi_partition_orc (event_day) with sync"""
-
- sql """switch ${catalog_name};"""
- logger.info("switched to catalog " + catalog_name)
- sql """use multi_partition;"""
- def result = sql """show column stats multi_partition_parquet
(event_day)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "event_day")
- assertEquals(result[0][2], "3.83714205E8")
- assertEquals(result[0][3], "99949.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "3.83714205E9")
- assertEquals(result[0][6], "10.0")
- assertEquals(result[0][7], "\'1749-09-24\'")
- assertEquals(result[0][8], "\'2023-05-26\'")
-
- result = sql """show column stats multi_partition_orc (event_day)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "event_day")
- assertEquals(result[0][2], "1.9007155E8")
- assertEquals(result[0][3], "99949.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "1.9007155E9")
- assertEquals(result[0][6], "10.0")
- assertEquals(result[0][7], "\'1749-09-24\'")
- assertEquals(result[0][8], "\'2023-05-26\'")
-
- sql """analyze table ${catalog_name}.partition_type.tinyint_partition
(tinyint_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.smallint_partition
(smallint_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.int_partition
(int_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.bigint_partition
(bigint_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.char_partition
(char_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.varchar_partition
(varchar_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.string_partition
(string_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.date_partition
(date_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.float_partition
(float_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.double_partition
(double_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.decimal_partition
(decimal_part) with sync"""
- sql """analyze table ${catalog_name}.partition_type.two_partition
(part1, part2) with sync"""
-
- sql """use partition_type;"""
-
- result = sql """show column stats tinyint_partition (tinyint_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "tinyint_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "141474.0")
- assertEquals(result[0][6], "1.0")
- assertEquals(result[0][7], "1")
- assertEquals(result[0][8], "100")
-
- result = sql """show column stats smallint_partition (smallint_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "smallint_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "282948.0")
- assertEquals(result[0][6], "2.0")
- assertEquals(result[0][7], "1")
- assertEquals(result[0][8], "100")
-
- result = sql """show column stats int_partition (int_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "int_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "565896.0")
- assertEquals(result[0][6], "4.0")
- assertEquals(result[0][7], "1")
- assertEquals(result[0][8], "100")
-
- result = sql """show column stats bigint_partition (bigint_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "bigint_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "1131792.0")
- assertEquals(result[0][6], "8.0")
- assertEquals(result[0][7], "1")
- assertEquals(result[0][8], "100")
-
- result = sql """show column stats char_partition (char_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "char_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "101.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "2829480.0")
- assertEquals(result[0][6], "20.0")
- assertEquals(result[0][7], "\'1 \'")
- assertEquals(result[0][8], "\'a \'")
-
- result = sql """show column stats varchar_partition (varchar_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "varchar_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "271630.0")
- assertEquals(result[0][6], "1.9199994345250717")
- assertEquals(result[0][7], "\'1\'")
- assertEquals(result[0][8], "\'99\'")
-
- result = sql """show column stats string_partition (string_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "string_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "271630.0")
- assertEquals(result[0][6], "1.9199994345250717")
- assertEquals(result[0][7], "\'1\'")
- assertEquals(result[0][8], "\'99\'")
-
- result = sql """show column stats date_partition (date_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "date_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "565896.0")
- assertEquals(result[0][6], "4.0")
- assertEquals(result[0][7], "\'2001-10-12\'")
- assertEquals(result[0][8], "\'2100-10-12\'")
-
- result = sql """show column stats float_partition (float_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "float_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "565896.0")
- assertEquals(result[0][6], "4.0")
- assertEquals(result[0][7], "296.3103")
- assertEquals(result[0][8], "32585.627")
-
- result = sql """show column stats double_partition (double_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "double_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "1131792.0")
- assertEquals(result[0][6], "8.0")
- assertEquals(result[0][7], "115.14474")
- assertEquals(result[0][8], "32761.14458")
-
- result = sql """show column stats decimal_partition (decimal_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "decimal_part")
- assertEquals(result[0][2], "141474.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "1131792.0")
- assertEquals(result[0][6], "8.0")
- assertEquals(result[0][7], "243.2868")
- assertEquals(result[0][8], "32527.1543")
-
- sql """analyze table ${catalog_name}.partition_type.decimal_partition
(decimal_part) with sync with sql"""
- result = sql """show column stats decimal_partition (decimal_part)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "decimal_part")
- assertEquals(result[0][2], "100000.0")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][5], "800000.0")
- assertEquals(result[0][6], "8.0")
- assertEquals(result[0][7], "243.2868")
- assertEquals(result[0][8], "32527.1543")
-
- result = sql """show column stats two_partition (part1)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "part1")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][7], "1")
- assertEquals(result[0][8], "100")
-
- result = sql """show column stats two_partition (part2)"""
- assertEquals(result.size(), 1)
- assertEquals(result[0][0], "part2")
- assertEquals(result[0][3], "100.0")
- assertEquals(result[0][4], "0.0")
- assertEquals(result[0][7], "\'1\'")
- assertEquals(result[0][8], "\'99\'")
-
+ try {
+ sql """set global enable_get_row_count_from_file_list=true"""
+ // Test analyze table without init.
+ sql """analyze table
${catalog_name}.multi_partition.multi_partition_parquet (event_day) with sync"""
+ sql """analyze table
${catalog_name}.multi_partition.multi_partition_orc (event_day) with sync"""
+
+ sql """switch ${catalog_name};"""
+ logger.info("switched to catalog " + catalog_name)
+ sql """use multi_partition;"""
+ def result = sql """show column stats multi_partition_parquet
(event_day)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "event_day")
+ assertEquals(result[0][2], "3.83714205E8")
+ assertEquals(result[0][3], "99949.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "3.83714205E9")
+ assertEquals(result[0][6], "10.0")
+ assertEquals(result[0][7], "\'1749-09-24\'")
+ assertEquals(result[0][8], "\'2023-05-26\'")
+
+ result = sql """show column stats multi_partition_orc
(event_day)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "event_day")
+ assertEquals(result[0][2], "1.9007155E8")
+ assertEquals(result[0][3], "99949.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "1.9007155E9")
+ assertEquals(result[0][6], "10.0")
+ assertEquals(result[0][7], "\'1749-09-24\'")
+ assertEquals(result[0][8], "\'2023-05-26\'")
+
+ sql """analyze table
${catalog_name}.partition_type.tinyint_partition (tinyint_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.smallint_partition (smallint_part) with sync"""
+ sql """analyze table ${catalog_name}.partition_type.int_partition
(int_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.bigint_partition (bigint_part) with sync"""
+ sql """analyze table ${catalog_name}.partition_type.char_partition
(char_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.varchar_partition (varchar_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.string_partition (string_part) with sync"""
+ sql """analyze table ${catalog_name}.partition_type.date_partition
(date_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.float_partition (float_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.double_partition (double_part) with sync"""
+ sql """analyze table
${catalog_name}.partition_type.decimal_partition (decimal_part) with sync"""
+ sql """analyze table ${catalog_name}.partition_type.two_partition
(part1, part2) with sync"""
+
+ sql """use partition_type;"""
+
+ result = sql """show column stats tinyint_partition
(tinyint_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "tinyint_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "141474.0")
+ assertEquals(result[0][6], "1.0")
+ assertEquals(result[0][7], "1")
+ assertEquals(result[0][8], "100")
+
+ result = sql """show column stats smallint_partition
(smallint_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "smallint_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "282948.0")
+ assertEquals(result[0][6], "2.0")
+ assertEquals(result[0][7], "1")
+ assertEquals(result[0][8], "100")
+
+ result = sql """show column stats int_partition (int_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "int_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "565896.0")
+ assertEquals(result[0][6], "4.0")
+ assertEquals(result[0][7], "1")
+ assertEquals(result[0][8], "100")
+
+ result = sql """show column stats bigint_partition (bigint_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "bigint_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "1131792.0")
+ assertEquals(result[0][6], "8.0")
+ assertEquals(result[0][7], "1")
+ assertEquals(result[0][8], "100")
+
+ result = sql """show column stats char_partition (char_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "char_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "101.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "2829480.0")
+ assertEquals(result[0][6], "20.0")
+ assertEquals(result[0][7], "\'1 \'")
+ assertEquals(result[0][8], "\'a \'")
+
+ result = sql """show column stats varchar_partition
(varchar_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "varchar_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "271630.0")
+ assertEquals(result[0][6], "1.9199994345250717")
+ assertEquals(result[0][7], "\'1\'")
+ assertEquals(result[0][8], "\'99\'")
+
+ result = sql """show column stats string_partition (string_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "string_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "271630.0")
+ assertEquals(result[0][6], "1.9199994345250717")
+ assertEquals(result[0][7], "\'1\'")
+ assertEquals(result[0][8], "\'99\'")
+
+ result = sql """show column stats date_partition (date_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "date_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "565896.0")
+ assertEquals(result[0][6], "4.0")
+ assertEquals(result[0][7], "\'2001-10-12\'")
+ assertEquals(result[0][8], "\'2100-10-12\'")
+
+ result = sql """show column stats float_partition (float_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "float_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "565896.0")
+ assertEquals(result[0][6], "4.0")
+ assertEquals(result[0][7], "296.3103")
+ assertEquals(result[0][8], "32585.627")
+
+ result = sql """show column stats double_partition (double_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "double_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "1131792.0")
+ assertEquals(result[0][6], "8.0")
+ assertEquals(result[0][7], "115.14474")
+ assertEquals(result[0][8], "32761.14458")
+
+ result = sql """show column stats decimal_partition
(decimal_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "decimal_part")
+ assertEquals(result[0][2], "141474.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "1131792.0")
+ assertEquals(result[0][6], "8.0")
+ assertEquals(result[0][7], "243.2868")
+ assertEquals(result[0][8], "32527.1543")
+
+ sql """analyze table
${catalog_name}.partition_type.decimal_partition (decimal_part) with sync with
sql"""
+ result = sql """show column stats decimal_partition
(decimal_part)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "decimal_part")
+ assertEquals(result[0][2], "100000.0")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][5], "800000.0")
+ assertEquals(result[0][6], "8.0")
+ assertEquals(result[0][7], "243.2868")
+ assertEquals(result[0][8], "32527.1543")
+
+ result = sql """show column stats two_partition (part1)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "part1")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][7], "1")
+ assertEquals(result[0][8], "100")
+
+ result = sql """show column stats two_partition (part2)"""
+ assertEquals(result.size(), 1)
+ assertEquals(result[0][0], "part2")
+ assertEquals(result[0][3], "100.0")
+ assertEquals(result[0][4], "0.0")
+ assertEquals(result[0][7], "\'1\'")
+ assertEquals(result[0][8], "\'99\'")
+ } finally {
+ sql """set global enable_get_row_count_from_file_list=false"""
+ }
sql """drop catalog ${catalog_name}"""
}
}
diff --git
a/regression-test/suites/external_table_p2/hive/test_hive_partition_statistic.groovy
b/regression-test/suites/external_table_p2/hive/test_hive_partition_statistic.groovy
index 73b6db1c646..6f398a62e3c 100644
---
a/regression-test/suites/external_table_p2/hive/test_hive_partition_statistic.groovy
+++
b/regression-test/suites/external_table_p2/hive/test_hive_partition_statistic.groovy
@@ -18,6 +18,8 @@
suite("test_hive_partition_statistic",
"p2,external,hive,external_remote,external_remote_hive") {
String enabled = context.config.otherConfigs.get("enableExternalHiveTest")
if (enabled != null && enabled.equalsIgnoreCase("true")) {
+ logger.info("This feature has not been supported yet, skip it.")
+ /**
String extHiveHmsHost =
context.config.otherConfigs.get("extHiveHmsHost")
String extHiveHmsPort =
context.config.otherConfigs.get("extHiveHmsPort")
String catalog_name = "test_hive_partition_statistic"
@@ -48,6 +50,7 @@ suite("test_hive_partition_statistic",
"p2,external,hive,external_remote,externa
order_qt_2 """select part_id, count, ndv, null_count, min, max from
internal.__internal_schema.column_statistics where catalog_id='$ctlId' and
part_id='event_day=1956-09-07'"""
sql """drop catalog ${catalog_name}""";
+ **/
}
}
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]