From 6c5ec15e100ee02dd60ff9a3819ca2df07be138b Mon Sep 17 00:00:00 2001 From: "github-actions[bot]" <41898282+github-actions[bot]@users.noreply.github.com> Date: Wed, 9 Jul 2025 10:58:48 +0800 Subject: [PATCH] branch-2.1: [fix](be) fix parquet file reader not updating page index when processing it #52228 (#52782) Cherry-picked from #52228 Co-authored-by: SWEI Co-authored-by: zengsiwei Co-authored-by: suxiaogang223 --- be/src/common/config.cpp | 2 +- .../vec/exec/format/parquet/vparquet_reader.cpp | 2 +- .../parquet/small_2rowgroup.parquet | Bin 0 -> 13059 bytes .../hive/test_hive_parquet_skip_page.out | 4 ++++ .../hive/test_hive_parquet_skip_page.groovy | 12 +++++++++++- 5 files changed, 17 insertions(+), 3 deletions(-) create mode 100644 docker/thirdparties/docker-compose/hive/scripts/preinstalled_data/parquet/small_2rowgroup.parquet diff --git a/be/src/common/config.cpp b/be/src/common/config.cpp index fa8e5e9272..640088a742 100644 --- a/be/src/common/config.cpp +++ b/be/src/common/config.cpp @@ -1345,7 +1345,7 @@ DEFINE_mInt64(compaction_batch_size, "-1"); // If set to false, the parquet reader will not use page index to filter data. // This is only for debug purpose, in case sometimes the page index // filter wrong data. -DEFINE_mBool(enable_parquet_page_index, "false"); +DEFINE_mBool(enable_parquet_page_index, "true"); DEFINE_mBool(ignore_not_found_file_in_external_table, "true"); diff --git a/be/src/vec/exec/format/parquet/vparquet_reader.cpp b/be/src/vec/exec/format/parquet/vparquet_reader.cpp index e51d27ce20..d14d77f70c 100644 --- a/be/src/vec/exec/format/parquet/vparquet_reader.cpp +++ b/be/src/vec/exec/format/parquet/vparquet_reader.cpp @@ -860,7 +860,7 @@ Status ParquetReader::_process_page_index(const tparquet::RowGroup& row_group, // use the union row range skipped_row_ranges.emplace_back(skipped_row_range); } - _col_offsets.emplace(parquet_col_id, offset_index); + _col_offsets[parquet_col_id] = offset_index; } if (skipped_row_ranges.empty()) { read_whole_row_group(); diff --git a/docker/thirdparties/docker-compose/hive/scripts/preinstalled_data/parquet/small_2rowgroup.parquet b/docker/thirdparties/docker-compose/hive/scripts/preinstalled_data/parquet/small_2rowgroup.parquet new file mode 100644 index 0000000000000000000000000000000000000000..dcd05f5e28e08e28d472b9682cf5fed1a87d0b14 GIT binary patch literal 13059 zcmWG=3^EjD5bbji?Q_r(Z4eM;5M>i(V_;xrU|?tvU}RumU;q(J3=km}1_lOJ1_lN; z1_lOp1_lNW1_lOB1_lN$1_lOh1_lNm1_lOR1_lN`1_lOx1_lNJ1_lN}1_lNp1_lOU z1_lNZ1_lOE1_lN(1_lOk1_lNR1_lO61_lNx1_lOc1_lNh1_lOM1_lN>1_lOs1_lNN z1_lO21_lNt1_lOY1_lNd1_lOI1_lN-1_lOo1_lNV1_lOA1_lN#1_lOg1_lNl1_lOQ z1_lN_1_lOw1_lNL1_lO01_lNr1_lOW1_lNb1_lOG1_lN*1_lOm1_lNT1_lO81_lNz z1_lOe1_lNj1_lOO1_lN@1_lOu1_lNP1_lO41_lNv1_lOa1_lNf1_lOK1_lN<1_lOq z1_lNX1_lOC1_lN%1_lOi1_lNn1_lOS1_lN{1_lOy1_p)z1_p*e1_p*81_p*;1_p)@ z1_p*u1_p*O1_p+31_p)*1_p*m1_p*G1_p*`1_p*01_p*$1_p*W1_p+B1_p)%1_p*i z1_p*C1_p*?1_p){1_p*y1_p*S1_p+71_p)<1_p*q1_p*K1_p*~1_p*41_p*)1_p*a z1_p+F1_p)#1_p*g1_p*A1_p*=1_p)_1_p*w1_p*Q1_p+51_p)-1_p*o1_p*I1_p*| z1_p*21_p*&1_p*Y1_p+DP!eEZU}$7uU}$1sU}$DwU}#}rU}$AvU}$4tU}$GxVCZ0A zVCZCEVCZ6CVCZIGVCZ3BVCZFFVCZ9DVCZLHV3@$bz%Y@4fngE@1H)tn28JmN3=C5l z7#OB8FfdGKU|^WRz`!t*fq`Kb0|Ucs1_p*X3=9l&85kJmF)%R9XJBAhz`($;kb!|= z5d#CmVg?3=B@7GV{!)XQvhBFKd3}+b_7|t;;Fq~&#V7S1*z;Ka)f#DJZ1H)wo28JsP z3=CHp7#OZGFfd$aU|_hxz`$^mfq~%`0|Uct1_p*Z3=9l+85kJuF)%RPXJBA>z`(%p zkb!~W5d#CmV+IC>CkzY>PZ<~(o-r^mJZE5Fc)`HH@REUn;S~b|!)pcxhBpih3~w12 z7~U~3FuZ4AVEDkm!0?fQf#DMa1H)$q28J&T3=Cfx7#O}WFfe>)U|{&cz`*d6fq~%{ z0|Ucv1_p*d3=9l^85kJ;F)%Rvhh~08Mg|5ZMg|6EMg|5JMg|5}Mg|5pMg|6UMg|5B zMg|5>Mg|5hMg|6MMg|5RMg|66Mg|5xMg|6cMg|5@2_neIz#zoPz#z=Xz#ziNz#z)V zz#zuRz#z`Zz#zfMz#z%Uz#zrQz#z@Yz#zlOz#z-Wz#zxSz#z}az@Wg$z@W&;z@Ws) zz@W^?z@Wm&z@W;=z@Wy+z@W~^z@Wj%z@W*>z@W#-z@X2_ zz+k}0z+lM8z+lA4z+lYCz+l42z+lSAz+lG6z+leEz+l11z+lP9z+lD5z+lbDz+l73 zz+lVBz+lJ7z+lhFz~I2hz~IQpz~IElz~Ictz~I8jz~IWrz~IKnz~Iivz~I5iz~ITq zz~IHmz~Ifuz~IBkz~IZsz~INoz~Ilwz!1R5z!1pDz!1d9z!1#Hz!1X7z!1vFz!1jB zz!1*Jz!1U6z!1sEz!1gAz!1&Iz!1a8z!1yGz!1mCz!1;Kz>vVmz>vtuz>vhqz>v(y zz>vboz>vzwz>vnsz>vvYnz>vwvz>vkrz>v+zz>vepz>v$xz>vqtz>v?#z)--* zz);A@z)-}z);S}z)-=+z);D^z);1=z);P|z)-`;z);J` zz);7?z);V~z|g?Rz|hFZz|h3Vz|hRdz|g|Tz|hLbz|h9Xz|hXfz|g_Sz|hIaz|h6W zz|hUez|h0Uz|hOcz|hCYz|hagz%YT4fng#e1H&Xn28PLu3=C5k85pKAGB8YIWMG)i z$iOgzk%3_*BLl-MMh1r2j0_BO7#SGmGBPmCV`N~M&&a^AfRTY=AtM9BB1Q&=#f%IL zOBfj#mNGIhEMsI~SkB16u!50+VI?C2!zxAwhSiJ=3~Lw}7}hc}Fsx%_U|7${z_5Xl zfng&f1H&dp28PXy3=CTs85p)QGB9joWMJ6N$iT3Jk%3_+BLl-OMh1r6j0_BW7#SG$ zGBPmiV`O01&&a@VfRTaWAR`0AAw~v>Fq~s#U^vgnz;J<)f#D(}1H&ao28PRw3=CHo85piIGB8|Y zWMH_?$iQ%ek%8eRBLl-NMh1r4j0_BS7#SGuGBPmSV`N~s&&a^=fRTaWAtM9BBSr>> z$BYaNPZ${(o-#5pJY!^Fc+SYc@Pd(n;Uyyj!z)GxhS!V?3~v}27~V26FuY@AV0h2S z!0>^Qf#D+~1H&gq28Pd!3=Cfw85q7YGBA8&WMKHt$iVP}k%8eSBLl-PMh1r8j0_Ba z7#SG;GBPmyV`O0X53TqanHU(Dm>3wCnHU&Ym>3vXnHU(@m>3w?nHU&2m>3v1nHU(j zm>3winHU&&m>3v%nHU)Om>3xNnHU%Zm>3uYnHU&^m>3v@nHU&Em>3vDnHU(vm>3wu znHU%(m>3u&nHU(Pm>3wOnHU&km>3vjnHU)4m>3x3nHU%pm>3uonHU(9m>3w8nHU&U zm>3vTnHU(3w;nHU%}m>3u|nHU(fm>3wenHU&!m>3vznHU)Km>3xJnHU%hm>3ug znHU(1m>3w0nHU&Mm>3vLnHU(%m>3w$nHU%>m>3u=nHU(Xm>3wWnHU&sm>3vrnHU)C zm>3xBnHU%xm>3uwnHU(Hm>3wGnHU&cm>3vbnHU({m>3w`nHU&6m>3v5nHU(nm>3wm znHU&+m>3v*nHU)Sm>3xRnHU%Xm>3uWnHU&?m>3v>nHU&Cm>3vBnHU(tm>3wsnHU%% zm>3u$nHU(Nm>3wMnHU&im>3vhnHU)2m>3x1nHU%nm>3umnHU(7m>3w6nHU&Sm>3vR znHU(-m>3w+nHU%{m>3u`nHU(dm>3wcnHU&ym>3vxnHU)Im>3xHnHU%fm>3uenHU&~ zm>3v}nHU&Km>3vJnHU(#m>3w!nHU%3u;nHU(Vm>3wUnHU&qm>3vpnHU)Am>3x9 znHU%vm>3uunHU(Fm>3wEnHU&am>3vZnHU(_m>3w^nHU&4m>3v3nHU(lm>3wknHU&) zm>3v(nHU)Qm>3xPnHU%*FflMpWMW{L#KgcbnTdg63KIjvR3-+7X-o_Z)0r3;W-u`@ z%w%F77#1)wFf3$ZU|7V&z_6H!fnf;~1H)1# z28Lx!3=GSe7#LPCF)*xTVqjRs#K5qciGg7a69dCqCI*IeObiU`nHU&0FflM}WMW|0 z#Kgd`nTdg63ljswRwf39ZA=Ud+nE>`b}%t8>||nK*u})au$zg2VGk1n!(Ju^hJ8#7 z4EvcF7!EKoFdSrJU^v9Yz;Kv}f#C=f1H(}!28Lry3=GGa7#L14F)*BDVqiGM#K3Tx ziGkq^69dCpCI*IcObiU?nHU%@FflM(WMW{r#KgdGnTdhn3KIjvRVD_8YfKCb*O?d? zZZI)0++<>4xW&Z4aGQyN;SLi6!(Ao@hI>p54ELEB7#=V&Fg#>pV0gsD!0?!ff#C@g z1H)4$28L%$3=Gei7#LnKF)+MjVqkd1#K7>HiGkq_69dCrCI*IgObiU~nHU&8FflNE zWMW|W#KgexnTdhn3ljswS0)CAZ%hmf-94F92xenw^n1}0_(24-dk1{P)p23BSU1~z5}26ko!1`cKh22N%M1}25x2s z1|DVx23}?c20ms627YD+1_5RU20>;91|en!24Q9f1`%ck22o}P1~Fy^261Kv1_@>c z21#ZH1}SC+25Dvn1{r1s23ckX203O126<)%1_fpY21RBD1|?<&24!Xj1{G!o232MT z1~p~|26biz1`TEg22ExL1}$a=25n{r1|4Pw23=+b20dm527P7*1_NdW218~B1|wz$ z24iLh1`}om22*AR1~X;`26JWx1`B2e21{lJ1}kO;25V*p1{-Du23uwZ20La3276`( z1_x#a21jNF1}A0)24`jl1{Y=q23KYV1~+B~26tu#1`lQi22W-N1}|m?25)8t1|Mby z247|d20vy727hJ-h5%*;hCpTph9G7JhG1p}h7e{3hEQe(hA?IZhHz#Eh6rW`hDc@x zhA3tRhG=F6h8SiBhFE3>hB#&hhInQMh6H8?hD2rth9qVNhGb?2h7@K7hE!$-hBRgd zhID2Ih74u~hD>G#hAd_VhHPdAh8$)FhFoR_hCF5lhJ0oQh5}{=hC*frh9YJLhGJ$0 zh7x85hEiq*hB9UbhH_>Gh6-i|hDv4zhAL(ThH7R8h8kuDhFWF@hB{^jhI(cOh6ZK^ zhDK%vh9+hPhGu34h8AW9hE`?RxvX$tY&6lSi{V~u$GyDVI4CA!+K^0h7HUN3>%pl7&b98Fl=UK zVA#UUz_68>fnggn1H*P^28JEX3=BJ&85njkGcfFCW? z%nS?%nHd-kF*7h6W@cbG!py*Ml$n9y7&8OIab^aF6U+<@Cz%--PBAkuoMvWVIK#}q zaF&^Y;T$sq!+B-~h6~IL3>TRh7%nk0FkEJ4V7S7}z;KnBf#Di61H*M@28J8V3=B7! z85nLcGcep{W?;C(%)oG$nStRRGXukYW(I}_%nS?p7(OvG zFnnfaVEDq!!0?rsf#Dl71H*S_28JKZ3=BV+85n*sGcf#SW?=Zk%)s!MnStRSGXuka zP+nya6%iHD5oHpEjthXw1SUoX7Em`H=cvI2b_Rxv>x7ZmNZnHBm++k;6xXaGKaF3mV;XXS9!vl5(hKKA743F3u z7#_1TFg#&rV0g;T!0?Qnf#Eqj1H%h;28NgH3=FT>85mx(GcdeiXJB~C&cN`Foq^#! zI|IW9b_Rxz>jh%tvJ39lz4|WEIpX>|_zt|ZVezP+$ z{9$Kc_{+|~@QEftQ1UfsccMfuDncL4bpSL6C!iL5PEaL70PqL4<>WL6n1mL5zce zL7anuL4t#UL6U=kL5hQcL7IbsL572YL6(DoL5_ogL7szwL4kvTL6L)jL5YKbL79Vr zL4|{XL6w7nL5+ifL7jtvL4$*VL6d`lL5qWdL7RhtL5G8ZL6?JpL63uhL7#(x!GME- z!H|Q2!H9!_!I*=A!Gwc>!IXo6!Hk1}!JLDE!GeQ z$-tn-$-tn_$-tn&$-tn=$-tn+$-tn^$-tn)$-tn?$-tn;$-tn`$-rR1$-rR9$-rR5 z$-rRD$-rR3$-rRB$-rR7$-rRF$-rR2$-rRA$-rR6$-rRE$-rR4$-rRC$-rR8$-rRG z$-v;i$-v;q$-v;m$-v;u$-v;k$-v;s$-v;o$-v;w$-v;j$-v;r$-v;n$-v;v$-v;l z$-v;t$-v;p$-v;x$-of6$-ofE$-ofA$-ofI$-of8$-ofG$-ofC$-ofK$-of7$-ofF z$-ofB$-ofJ$-of9$-ofH$-ofD$-ofL$-t1n$-t1v$-t1r$-t1z$-t1p$-t1x$-t1t z$-t1#$-t1o$-t1w$-t1s$-t1!$-t1q$-t1y$-t1u$-t1$$-q#+$-q#^$-q#=$-q#| z$-q#;$-q#`$-q#?$-q#~$-q#-$-q#_$-q#>$-q#}$-q#<$-q#{$-q#@$-q$0$-vOS z$-vOa$-vOW$-vOe$-vOU$-vOc$-vOY$-vOg$-vOT$-vOb$-vOX$-vOf$-vOV$-vOd z$-vOZ$-vOh$-ppylYwC(Cj-MIP6md_oD2+8I2jnGaxySX<78l%&dIAgOh<_Cnp2LE=~r9-JA>zdpH>w_Hr^X?Bir$*w4wp zaDbD6;UFgi!y!%vhQpi;3`aN_7>;r>FdXA#U^vdnz;J?-f#D=41H&m!28Pp|3=C&D z85quTGBBLuWMDYY$-r=dlY!wPCj-MJP6md{oD2+CI2jnOaxySn<78mC&dI=VgOh>b zCMN^KElvi8+nfvxcQ_ds?s76P+~Z_mxX;PJ@PLzn;UOmj!y`@xhR2)?3{N;27@l%6 zFg)XAV0g~S!0>{Tf#D@51H&s$28P$13=D5L85rJjGBCX3WMFvD$-wY|lY!wQCj-ML zP6me0oD2+KI2jneaxyS{<78m?&dI>=gOh>bCnp2LFHQ!A-<%8#e>fQ!{&F%f{NrR` z_z#`VVB}(8VB%t6VCG_AVBun5VC7<9VB=z7VCQ0B;NW6l;N)Up;NoIn;O1gr;NfCm z;N@aq;NxOo;OAms5a4295aeQD5aMEB5awcF5aD8A5anWE5aVKC5a(iGkl7@P~u`>Q08J_P~l==P~~D^P~&1? zQ0HP`(BNWV(BxuZ(BfiX(B@)b(BWcW(B)!a(BooY(C1=cFyLZfFyvxjFydlhFy>-l zFyUfgFy&%kFymriFy~@mu;5}~u;gN3u;OB1u;yZ5u;F50u;pT4u;XH2u;*f6aNuHK zaO7fOaN=TMaOPrQaN%NLaOGlPaN}ZNaOYxR@Ze%#@Z@4(@Zw@%@aAG*@Zn-$@a1A) z@Z(}&@aJM+2;gF12;^d52;yR32k zh~{Eoh~Z*jh~;8nh~r{li05KpNZ?{%NaSK*NaA8(NakW-Na12&NabQ+NaJE)Natc; z$lzjN$mC*R$l_vP$mU{T$l+pO$mL>S$m3#Q$me2UDBxmXDCA;bDB@yZDCS~dDB)sY zDCJ^cDC1&aDCc5esNiB?sN`Z`sN!N^sODl|sNrH@sO4f{sN-T_sOMr}Xy9UCXyjsG zXyRgEXy#&IXyIaDXysyHXyamFXy;;J=-^^t=;UHx=;C5v=;mTz=;2~u=;dNy=;LBw z=;vZ!n83xrFp-OaVGz;Kg`f#DVx z1H)}D28KIa3=DU<7#QwxF)-ZcVqkc{#lY~8i-F-07X!m%E(V4tTnr3PxfmFpaWODF z=VD-Z!NtJvl8b@i6&C};Yc2+cH(U%1Z@Cy4-f=N7yys$I_`t=$@R5sw;S(1F!)GoA zhA&(U3}3kz7`|~aFns4?VEDns!0?lcf#DYy1H*4F28KUe3=Ds{7#RL>F);jxPGvH3 zGcYi5GcYi7Gcd4lGcd4nGcd4mGcd4oGca&)Gca&+Gca&*Gca&-GcfRQGcfRSGcfRR zGcfRTGcX8nGcX8pGcX8oGcX8qGcbs7Gcbs9Gcbs8GcbsAGcZVSGcZVUGcZVTGcZVV zGcd?-Gcd?GcfdUGcfdWGcfdVGcfdXGcZix zW?-1e&A>2;n}K06Hv_{IZU%;_+zbrUxEUCxb2Bi^;AUW$$<4qpi<^OAHa7#q9Bu}N zx!ep4^SBup=5sSJEZ}BfSjf%5u!x(1VKFxY!xC-=hNavL49mC~7?yK0Fs$HaU|7k` zz_5y&fnhZ_1H&3_28OlV3=HeI85q`cGcau6W?b2BjP;AUXh$<4s9i<^OAH#Y;r9&QGPz1$28`?whx_H#2Z9N=bPILOVwaEP0M z;V?G?!x3%;u@Fr46KU^vOmz;KG2f#Eba1H&0^28OfT3=HSE85quk z(mL)11sAv(7%p-%FkIqhV7Sc9z;K0|f#E7Q1H(0L28Qe03=B8885nMIGcerZW?;C@ z&A@Pnn}OjjHv_{xZU%PUUD-qyy9kHc+Jhg@P?a#;Vm}VED| zJPZuXJPZshJPZu1JPZtMJPZu%JPZsRJPZt+JPZt6JPZunJPZsxJPZuHJPZtcJPZu{ zJPZs1JPZtiJPZs%JPZuNJPZsXJPZt?JPZtCJPZutJPZsHJPZtyJPZs{JPZudJPZsn zJPZu7JPZtSJPZu-JPZs9JPZtqJPZsJPZsDJPZtuJPZs@JPZuZ zJPZsjJPZu3JPZtOJPZu(JPZsTJPZt;JPZt8JPZupJPZszJPZuJJPZteJPZu}JPZs0 zJPZthJPZs$JPZuMJPZsWJPZt>JPZtBJPZusJPZsGJPZtxJPZs`JPZucJPZsmJPZu6 zJPZtRJPZu+JPZs8JPZtpJPZs;JPZuUJPZseJPZt}JPZtJJPZu!JPZsOJPZt(JPZt3 zJPZukJPZsuJPZuEJPZtZJPZu^JPZs4JPZtlJPZs)JPZuQJPZsaJPZt_JPZtFJPZuw zJPZsKJPZt#JPZs~JPZugJPZsqJPZuAJPZtVJPZu=JPZsCJPZttJPZs?JPZuYJPZsi zJPZu2JPZtNJPZu&JPZsSJPZt-JPZt7JPZuoJPZsyJPZuIJPZtdJPZu|JPZsIco-Na z@-Q$=;$dKz%)`Jig@=J*Dh~t0G#&U|7tN28QK43=AuH7#LRaFfgp* zVPIIz!@#hHhk;=&4+FzG9tMW>JPZsQco-Nq@-Q%L;$dLe%)`L2g@=J*D-Q$1HXa6s z?K}(&J9rovcJeSV?BZcy*v-Shu!o0%VJ{B@!#*AchW$JY3pTn$H+UErZt^fN+~Q$ixXr`BaEFJ1 z;VusY!#y4bhWk7W3=eo17#{L4Fg)U6V0g^K!0?2Jf#E3+1H&^O28QQ63=A)L7#Lpi zFfhF0VPJU8!@%%{hk@ZO4+FzH9tMW@JPZsUco-Ny@-Q%b;$dL;%)`L&g@=LRD-Q$1 zHy#Ft?>r0)KX@1ze)2Fd{NiC?_|3z>@P~(i;V%yZ!#^GdhX2sjO^mz@3{1QX49vU? z3@p4146M8i3~am%4D7rN3>>@+44k|S3|zbn4BWg73_QFH47|Jy41Bx{4E($d3v%)44S+Q3|hPl z4BEU53_83F47$7w40^l_4Enqb3R492_+3?{q`45qvc3}(Cx4CcHH z3>Lf$43@kM3|71h4A#613^u$B47R)s40gN>4EDSX3=X^u434}E3{JcZ49>g^3@*G3 z46eKk3~sy(4DP%P3?94;44%9U3|_np4Bos93_iRJ48FV!41T-}4F0?f3<10h41v51 z3_-jM48gn%3?aM>457RX3}L(s4B@;C3=zBx43WGH3{kuc4AHy{3^BY646(cn3~{^+ z4Dq}S3<f3~9U!4C%ZK3>mx(44J$P3|YJk4B5O4 z3^}|E47t1v40*f^4Eeka3CZ# z43)eL3{|`g4As003^lwA47I!r40XH=4E4MW3=O;t42`@D3{AWY49&a@3@yA246VEj z3~js&4DGxO3>~}-44u3T3|+ho4Bfm83_ZLI486Pz41K%|4E?+e3=?=67$)*EFihfQ zV3^Fyz%YfEfnh2y1H&|428QXp3=A`P85m~rGBC{IWnh@i%fK*)mw{m}F9X9oUIvEw zybKHrco`TL@-i?i;$>i1%*(*AgqML~DK7)VGF}FT<-80GD|i_gR`N11tm0*0Sk248 zu!fg`VJ$BM!#Z9DhV{G*3>$bE7&h`UFl^#wVA#ydz_5jvfnh5z1H(3628Qjt3=BJX z85nl*GBE7oWnkFN%fPUQmw{m~F9X9qUIvE!ybKHnco`TD@-i?S;$>hs%*()VgqMNg zC@%xUFSDA7%uWM zFkIqgV7Sc7z;K0^f#E7I1H(0528Qdr3=B7T85nNzGBDiYWnj3?%fN7lmx19fF9X9p zUIvEyybKHvco`TT@-i?y;$>iX%*(*=gqMNgDK7)VGhPOU=e!IIFL)UkUh*<9yy9hG zc+Jbe@P?Ox;Vmx%!#iFEhWES-3?FzI7(VhcFnr==VED|-!0?5af#EAJ1H(6728Qpv z3=BVb85n-@GBEt&WnlQt%fRr5mx19gF9X9rUIvE$(3Ophd<+asd<+cCd<+aMd<+b% zd<+b1d<+cid<+a6d<+bnd<+a+d<+cSd<+acd<+b{d<+bHd<+cyd<+Z%d<+bNd<+ai zd<+c2d<+aCd<+btd<+a?d<+cYd<+Z{d<+bdd<+ayd<+cId<+aSd<+b-d<+b7d<+co zd<+Zd<+bBd<+csd<+Z@d<+bZd<+aud<+cEd<+aOd<+b(d<+b3 zd<+ckd<+a8d<+bpd<+a;d<+cUd<+aed<+b}d<+bJd<+c!d<+Z$d<+bMd<+ahd<+c1 zd<+aBd<+bsd<+a>d<+cXd<+Z`d<+bcd<+axd<+cHd<+aRd<+b+d<+b6d<+cnd<+Z; zd<+bUd<+apd<+c9d<+aJd<+b!d<+a}d<+cfd<+a3d<+bkd<+a(d<+cPd<+aZd<+b^ zd<+bEd<+cvd<+Z)d<+bQd<+ald<+c5d<+aFd<+bwd<+a_d<+cbd<+Z~d<+bgd<+a# zd<+cLd<+aVd<+b=d<+bAd<+crd<+Z?d<+bYd<+atd<+cDd<+aNd<+b&d<+b2d<+cj zd<+a7d<+bod<+a-d<+cTd<+add<+b|d<+bId<+czd<+Z|_!t-_@-Z+>;$vW#%*Vhm zg^z(@Djx&GG(HA~>3j?fGx!)7X7VvG%;IBUn9aw)Fo%zUVJ;s7!#q9)hWUI93=8-e z7#8v|Ff8I@U|7t@z_5gmfng~h1H&>t28QK)3=Avy7#LRaF)*y+V_;a#$H1_LkAYz= z9|OZWJ_d&Md<+a5_!t;A@-Z-M;$vXg%*Vj6g^z(@D<1>HHa-T1?R*RjJNOtFcJeVW z?BZi!*v-elu!oOwF9hH~1JBZt^iO+~Q+kxXs7FaEFh9;VvHo!#zF*hWmUB z3=jAi7#{L5Fg)U8V0g^O!0?2Rf#E411H&^u28QQ+3=A*$7#LpiF)+O1V_HH$Dc2?|cjlKlm6J ze)2Ie{NiI^_|3<_@Q06q;V&Np!#_R-hX2r2&5ZmE3{3nC49xrt3@rQ%46OVN3~c-i z4D9?23>^Fn44nK73|#yS4BY$-3_Sb{47~gd41D|y4E+2I3y3l44V853|jmQ4BGq*3_AP_47&Ub z40`+w4Ep>G3x45s`H3}*Zc4Ced{3>N$h43_*13|9OM z4A%S%3^x1>47U6X40iks4EFpC3=aGZ437K^3{LzE49@%v3@-c(46ghP3~u}k4DS34 z3?BRp44(W93|{;U4Bq?<3_kn}48Hsf41W9!4F3EK3<3NM41xR%3_<)148i;i3?cjs z459oC3}O5X4B`9?3=#Yc43Yc{3{m_H4AJ}y3^Du+46*zS3~~Gn4DtL73<>-U42k>< z3`zV949WZq3@Q8!45|DK3~Brf4C(v~3>o|k44M243|agP4B7k)3_1J^47vOa40-$v z4Eg*F3Ewg43+#03|0IL4AuM$ z3^n`=47L0W40Zer4E6jB3=RAY42}E@3{CtD49)xu3@!W&46XbO3~l@j4DI|33?2Lo z44wQ83|;&T4Bh+;3_bh|488me41N3z4E_8J3={Yn7$)*FFihfSV3^F$z%YfMfnh2? z1H&|a28QYU3=A{)85m~rGce5JXJDAk&%iK;pMha6KLf)&eg=m5{0s~W_!$@$@-r|j z;%8u3%+J8Egr9+7DL(_lGJXbz<@^i`EBF~0R`N42tm0>2Sk2GCu!f(3VJ$xc!#aKj zhV}dm3>)|v7&h`VFl^#yVA#yhz_5j%fnh5@1H(3c28QkY3=BK?85nl*GcfGpXJFXP z&%m&UpMha7KLf))eg=m9{0s~S_!$@u@-r|T;%8tu%+J7Zgr9-oC_e+kF@6Sy zP|{aqVv^JV?J{6s0WC6+)L;QELjbcynIzR17&P4&8Uz@a7$gmun3yCjSU_tHSU{r+ zEFd!^Em%MU5G)|8SU?7fGD(8g`fH|vbTtSturNsKh;fK+a}Z--5ZmVWtvER&H8)X|i9wV}l}UmzkwL7@ zKvG9iMvXy6lu1&RjX_d^F;SF3tVuxZjf2=52Q>~G39#cOz zFxY6aNvbh42{15-Jvq!Msv$P-5Tj@a1IUaf0W}V>Hx3M#cC;vnt!iWhVYM#~HWFa( zN`S)yWDUsk5FX4LHmEf%3JeTlJx3Ttoy0yJViYZ602v|HqM-K00mNdEl#$?Z3<~lO zw}SXqVhy7{2pFe3IyyQAf(S=PM{h^Ra!03hM>j{ubVp~fl%tcAqoXfK-r3R76GS^9 zXh%m!SCCLBh;Vgu3_s8a@r?F_aj-O;HW zVh>2nF&IqRGDs*CBo-Bxrk3a?7Zm6w78T`}E0m=c6=&w>DHs{(8R!{E%7FHnfY#!I Hw!Z)XQex{j literal 0 HcmV?d00001 diff --git a/regression-test/data/external_table_p0/hive/test_hive_parquet_skip_page.out b/regression-test/data/external_table_p0/hive/test_hive_parquet_skip_page.out index 6c869dbc78..a8973479e4 100644 --- a/regression-test/data/external_table_p0/hive/test_hive_parquet_skip_page.out +++ b/regression-test/data/external_table_p0/hive/test_hive_parquet_skip_page.out @@ -1,4 +1,8 @@ -- This file is automatically generated. You should know what you did if you want to edit this +-- !small_2rowgroup -- +1024 +4049 + -- !q01 -- 1 2132 4633 4 28.00 28955.64 0.09 0.06 N O 1996-04-21 1996-03-30 1996-05-16 NONE AIR lites. fluffily even de 1 15635 638 6 32.00 49620.16 0.07 0.02 N O 1996-01-30 1996-02-07 1996-02-03 DELIVER IN PERSON MAIL arefully slyly ex diff --git a/regression-test/suites/external_table_p0/hive/test_hive_parquet_skip_page.groovy b/regression-test/suites/external_table_p0/hive/test_hive_parquet_skip_page.groovy index ebdbedf139..0bded7d820 100644 --- a/regression-test/suites/external_table_p0/hive/test_hive_parquet_skip_page.groovy +++ b/regression-test/suites/external_table_p0/hive/test_hive_parquet_skip_page.groovy @@ -94,11 +94,21 @@ suite("test_hive_parquet_skip_page", "p0,external,hive,external_docker,external_ return; } + String externalEnvIp = context.config.otherConfigs.get("externalEnvIp") + def hdfs_port = context.config.otherConfigs.get("hive2HdfsPort") + def defaultFS = "hdfs://${externalEnvIp}:${hdfs_port}" + def hdfsUserName = "doris" + def uri = "${defaultFS}" + "/user/doris/preinstalled_data/parquet/small_2rowgroup.parquet" + qt_small_2rowgroup """ select * from HDFS( + "uri" = "${uri}", + "hadoop.username" = "${hdfsUserName}", + "format" = "parquet") where a = 1024 or a = 4049 + order by a;""" + for (String hivePrefix : ["hive2", "hive3"]) { try { String hms_port = context.config.otherConfigs.get(hivePrefix + "HmsPort") String catalog_name = "${hivePrefix}_test_parquet_skip_page" - String externalEnvIp = context.config.otherConfigs.get("externalEnvIp") sql """drop catalog if exists ${catalog_name}""" sql """create catalog if not exists ${catalog_name} properties (