From d2b5015d3fd9729711f4dd6730448b9884b7a043 Mon Sep 17 00:00:00 2001 From: luozenglin <37725793+luozenglin@users.noreply.github.com> Date: Sat, 4 Feb 2023 22:59:34 +0800 Subject: [PATCH] [enhancement](profile) add the profile counter RawRowsRead to record the rows read from the parquet file (#16328) --- be/src/vec/exec/format/parquet/vparquet_reader.cpp | 3 +++ be/src/vec/exec/format/parquet/vparquet_reader.h | 1 + 2 files changed, 4 insertions(+) diff --git a/be/src/vec/exec/format/parquet/vparquet_reader.cpp b/be/src/vec/exec/format/parquet/vparquet_reader.cpp index 1e9e4bd25a..1b7653433a 100644 --- a/be/src/vec/exec/format/parquet/vparquet_reader.cpp +++ b/be/src/vec/exec/format/parquet/vparquet_reader.cpp @@ -71,6 +71,8 @@ void ParquetReader::_init_profile() { ADD_CHILD_COUNTER(_profile, "FilteredRowsByLazyRead", TUnit::UNIT, parquet_profile); _parquet_profile.filtered_bytes = ADD_CHILD_COUNTER(_profile, "FilteredBytes", TUnit::BYTES, parquet_profile); + _parquet_profile.raw_rows_read = + ADD_CHILD_COUNTER(_profile, "RawRowsRead", TUnit::UNIT, parquet_profile); _parquet_profile.to_read_bytes = ADD_CHILD_COUNTER(_profile, "ReadBytes", TUnit::BYTES, parquet_profile); _parquet_profile.column_read_time = @@ -112,6 +114,7 @@ void ParquetReader::close() { COUNTER_UPDATE(_parquet_profile.lazy_read_filtered_rows, _statistics.lazy_read_filtered_rows); COUNTER_UPDATE(_parquet_profile.filtered_bytes, _statistics.filtered_bytes); + COUNTER_UPDATE(_parquet_profile.raw_rows_read, _statistics.read_rows); COUNTER_UPDATE(_parquet_profile.to_read_bytes, _statistics.read_bytes); COUNTER_UPDATE(_parquet_profile.column_read_time, _statistics.column_read_time); COUNTER_UPDATE(_parquet_profile.parse_meta_time, _statistics.parse_meta_time); diff --git a/be/src/vec/exec/format/parquet/vparquet_reader.h b/be/src/vec/exec/format/parquet/vparquet_reader.h index 904f528b7b..a2125450e1 100644 --- a/be/src/vec/exec/format/parquet/vparquet_reader.h +++ b/be/src/vec/exec/format/parquet/vparquet_reader.h @@ -114,6 +114,7 @@ private: RuntimeProfile::Counter* filtered_page_rows; RuntimeProfile::Counter* lazy_read_filtered_rows; RuntimeProfile::Counter* filtered_bytes; + RuntimeProfile::Counter* raw_rows_read; RuntimeProfile::Counter* to_read_bytes; RuntimeProfile::Counter* column_read_time; RuntimeProfile::Counter* parse_meta_time;