This is an automated email from the ASF dual-hosted git repository.
morningman pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/doris.git
The following commit(s) were added to refs/heads/master by this push:
new 42136081e7b [Fix](hive-writer) Fix hive partition update file size and
remove redundant column names. (#34651)
42136081e7b is described below
commit 42136081e7beaa30dbbc724621e6aa7a462647fc
Author: Qi Chen <[email protected]>
AuthorDate: Tue May 14 10:11:15 2024 +0800
[Fix](hive-writer) Fix hive partition update file size and remove redundant
column names. (#34651)
---
be/src/vec/sink/writer/vhive_partition_writer.cpp | 7 ++++---
be/src/vec/sink/writer/vhive_partition_writer.h | 1 -
2 files changed, 4 insertions(+), 4 deletions(-)
diff --git a/be/src/vec/sink/writer/vhive_partition_writer.cpp b/be/src/vec/sink/writer/vhive_partition_writer.cpp
index 1e1faef7e80..37203911964 100644
--- a/be/src/vec/sink/writer/vhive_partition_writer.cpp
+++ b/be/src/vec/sink/writer/vhive_partition_writer.cpp
@@ -64,7 +64,9 @@ Status VHivePartitionWriter::open(RuntimeState* state, RuntimeProfile* profile)
std::vector<std::string> column_names;
column_names.reserve(_columns.size());
for (int i = 0; i < _columns.size(); i++) {
- column_names.emplace_back(_columns[i].name);
+ if (_non_write_columns_indices.find(i) == _non_write_columns_indices.end()) {
+ column_names.emplace_back(_columns[i].name);
+ }
}
switch (_file_format_type) {
@@ -155,7 +157,6 @@ Status VHivePartitionWriter::write(vectorized::Block& block, vectorized::IColumn
RETURN_IF_ERROR(_projection_and_filter_block(block, filter, &output_block));
RETURN_IF_ERROR(_file_format_transformer->write(output_block));
_row_count += output_block.rows();
- _input_size_in_bytes += output_block.bytes();
return Status::OK();
}
@@ -198,7 +199,7 @@ THivePartitionUpdate VHivePartitionWriter::_build_partition_update() {
hive_partition_update.__set_location(location);
hive_partition_update.__set_file_names({_get_target_file_name()});
hive_partition_update.__set_row_count(_row_count);
- hive_partition_update.__set_file_size(_input_size_in_bytes);
+ hive_partition_update.__set_file_size(_file_format_transformer->written_len());
if (_write_info.file_type == TFileType::FILE_S3) {
doris::io::S3FileWriter* s3_mpu_file_writer =
diff --git a/be/src/vec/sink/writer/vhive_partition_writer.h b/be/src/vec/sink/writer/vhive_partition_writer.h
index 8c63d855a02..b725bcd73f0 100644
--- a/be/src/vec/sink/writer/vhive_partition_writer.h
+++ b/be/src/vec/sink/writer/vhive_partition_writer.h
@@ -92,7 +92,6 @@ private:
TUpdateMode::type _update_mode;
size_t _row_count = 0;
- size_t _input_size_in_bytes = 0;
const VExprContextSPtrs& _vec_output_expr_ctxs;
const VExprContextSPtrs& _write_output_expr_ctxs;
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]