From 7a527c7d811d800a4d48236ef1f8fc93c38e1e3c Mon Sep 17 00:00:00 2001 From: Gabriel Date: Fri, 15 May 2026 20:14:02 +0800 Subject: [PATCH] [fix](parquet) Fix wrong encoding for parquet page v2 --- be/src/format/parquet/vparquet_group_reader.cpp | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/be/src/format/parquet/vparquet_group_reader.cpp b/be/src/format/parquet/vparquet_group_reader.cpp index 6863926ddba56d..7fb2c6fe67c770 100644 --- a/be/src/format/parquet/vparquet_group_reader.cpp +++ b/be/src/format/parquet/vparquet_group_reader.cpp @@ -277,7 +277,8 @@ bool RowGroupReader::is_dictionary_encoded(const tparquet::ColumnMetaData& colum if (column_metadata.__isset.encoding_stats) { // Condition #1 above for (const tparquet::PageEncodingStats& enc_stat : column_metadata.encoding_stats) { - if (enc_stat.page_type == tparquet::PageType::DATA_PAGE && + if ((enc_stat.page_type == tparquet::PageType::DATA_PAGE || + enc_stat.page_type == tparquet::PageType::DATA_PAGE_V2) && (enc_stat.encoding != tparquet::Encoding::PLAIN_DICTIONARY && enc_stat.encoding != tparquet::Encoding::RLE_DICTIONARY) && enc_stat.count > 0) {