diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query1.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query1.q.out index 9c98d2820e2c..900c47e7bf62 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query1.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query1.q.out @@ -6,10 +6,10 @@ HiveProject(d_date_sk=[$0]) CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(c_customer_id=[$1]) - HiveJoin(condition=[AND(=($3, $7), >($4, $6))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(c_customer_sk=[$0], c_customer_id=[$1]) - HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(c_customer_sk=[$0], c_customer_id=[$1]) + HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveJoin(condition=[AND(=($1, $5), >($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $1)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]) HiveFilter(condition=[IS NOT NULL($2)]) @@ -24,16 +24,16 @@ HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(s_store_sk=[$0]) HiveFilter(condition=[=($24, _UTF-16LE'NM')]) HiveTableScan(table=[[default, store]], table:alias=[store]) - HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]) - HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]) - HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]) - HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]) - HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]) - HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]) - HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]) - HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[=($6, 2000)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]) + HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]) + HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]) + HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]) + HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]) + HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]) + HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]) + HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[=($6, 2000)]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query26.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query26.q.out index dda45cc67163..f8d40531b0e6 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query26.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query26.q.out @@ -1,23 +1,23 @@ CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(i_item_id=[$0], agg1=[/(CAST($1):DOUBLE, $2)], agg2=[CAST(/($3, $4)):DECIMAL(11, 6)], agg3=[CAST(/($5, $6)):DECIMAL(11, 6)], agg4=[CAST(/($7, $8)):DECIMAL(11, 6)]) - HiveAggregate(group=[{12}], agg#0=[sum($3)], agg#1=[count($3)], agg#2=[sum($4)], agg#3=[count($4)], agg#4=[sum($6)], agg#5=[count($6)], agg#6=[sum($5)], agg#7=[count($5)]) - HiveJoin(condition=[=($1, $11)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $10)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($0, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $8)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveAggregate(group=[{1}], agg#0=[sum($5)], agg#1=[count($5)], agg#2=[sum($6)], agg#3=[count($6)], agg#4=[sum($8)], agg#5=[count($8)], agg#6=[sum($7)], agg#7=[count($7)]) + HiveJoin(condition=[=($3, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_item_sk=[$0], i_item_id=[$1]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveJoin(condition=[=($0, $10)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $9)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $8)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_bill_cdemo_sk=[$3], cs_item_sk=[$14], cs_promo_sk=[$15], cs_quantity=[$17], cs_list_price=[$19], cs_sales_price=[$20], cs_coupon_amt=[$26], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($15), IS NOT NULL($3), IS NOT NULL($33))]) HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[=($6, 1998)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cd_demo_sk=[$0]) - HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(i_item_sk=[$0], i_item_id=[$1]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[=($6, 1998)]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(cd_demo_sk=[$0]) + HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query47.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query47.q.out index fe7c57f5f164..4ed659084cf8 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query47.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query47.q.out @@ -56,10 +56,10 @@ HiveProject(i_category=[$0], d_year=[$1], d_moy=[$2], avg_monthly_sales=[$3], su HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) HiveProject(s_store_sk=[$0], s_store_name=[$5], s_company_name=[$17]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($17))]) + HiveFilter(condition=[AND(IS NOT NULL($17), IS NOT NULL($5))]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveJoin(condition=[AND(=($6, $0), =($7, $1), =($8, $2), =($9, $3), =($14, $5))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col s_store_name)=[$2], (tok_table_or_col s_company_name)=[$3], (tok_function sum (tok_table_or_col ss_sales_price))=[$4], EXPR$0=[+($5, 1)]) @@ -77,10 +77,10 @@ HiveProject(i_category=[$0], d_year=[$1], d_moy=[$2], avg_monthly_sales=[$3], su HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) HiveProject(s_store_sk=[$0], s_store_name=[$5], s_company_name=[$17]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($17))]) + HiveFilter(condition=[AND(IS NOT NULL($17), IS NOT NULL($5))]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col s_store_name)=[$2], (tok_table_or_col s_company_name)=[$3], (tok_table_or_col d_year)=[$4], (tok_table_or_col d_moy)=[$5], (tok_function sum (tok_table_or_col ss_sales_price))=[$6], avg_window_0=[$7], rank_window_1=[$8]) HiveFilter(condition=[AND(=($4, 2000), >($7, 0:DECIMAL(1, 0)), CASE(>($7, 0:DECIMAL(1, 0)), >(/(ABS(-($6, $7)), $7), 0.1:DECIMAL(1, 1)), false), IS NOT NULL($8))]) @@ -97,9 +97,9 @@ HiveProject(i_category=[$0], d_year=[$1], d_moy=[$2], avg_monthly_sales=[$3], su HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) HiveProject(s_store_sk=[$0], s_store_name=[$5], s_company_name=[$17]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($17))]) + HiveFilter(condition=[AND(IS NOT NULL($17), IS NOT NULL($5))]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) HiveTableScan(table=[[default, item]], table:alias=[item]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query53.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query53.q.out index 07fa3e1c3c13..d479f73cc927 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query53.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query53.q.out @@ -11,7 +11,7 @@ HiveSortLimit(sort0=[$2], sort1=[$1], sort2=[$0], dir0=[ASC], dir1=[ASC], dir2=[ HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($22))]) HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) HiveProject(i_item_sk=[$0], i_manufact_id=[$13]) - HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) + HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveProject(d_date_sk=[$0], d_qoy=[$10]) HiveFilter(condition=[IN($3, 1212, 1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223)]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query54.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query54.q.out index 3cfb0a6d6128..b011c8248316 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query54.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query54.q.out @@ -6,86 +6,87 @@ CTE Suggestion: HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) -Warning: Map Join MAPJOIN[292][bigTable=?] in task 'Map 1' is a cross product -Warning: Map Join MAPJOIN[286][bigTable=?] in task 'Map 1' is a cross product -Warning: Map Join MAPJOIN[294][bigTable=?] in task 'Map 21' is a cross product -Warning: Map Join MAPJOIN[291][bigTable=?] in task 'Map 21' is a cross product +Warning: Map Join MAPJOIN[283][bigTable=?] in task 'Map 1' is a cross product +Warning: Map Join MAPJOIN[289][bigTable=?] in task 'Reducer 13' is a cross product +Warning: Map Join MAPJOIN[290][bigTable=?] in task 'Map 6' is a cross product +Warning: Map Join MAPJOIN[284][bigTable=?] in task 'Map 6' is a cross product CBO PLAN: HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(segment=[$0], num_customers=[$1], segment_base=[*($0, 50)]) HiveAggregate(group=[{0}], agg#0=[count()]) HiveProject($f0=[CAST(/($1, 50:DECIMAL(10, 0))):INTEGER]) - HiveAggregate(group=[{10}], agg#0=[sum($1)]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveAggregate(group=[{14}], agg#0=[sum($1)]) + HiveJoin(condition=[=($14, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[true], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[true], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ss_customer_sk=[$2], ss_ext_sales_price=[$14], ss_sold_date_sk=[$22]) - HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($22))]) - HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) - HiveProject(cnt=[$0]) - HiveFilter(condition=[sq_count_check($0)]) - HiveProject(cnt=[$0]) - HiveAggregate(group=[{}], cnt=[COUNT()]) - HiveProject($f0=[$0]) - HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 3)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(ss_customer_sk=[$2], ss_ext_sales_price=[$14], ss_sold_date_sk=[$22]) + HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($22))]) + HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) HiveProject(cnt=[$0]) HiveFilter(condition=[sq_count_check($0)]) HiveProject(cnt=[$0]) HiveAggregate(group=[{}], cnt=[COUNT()]) HiveProject($f0=[$0]) HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 1)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(ca_address_sk=[$0], ca_county=[$1], ca_state=[$2], s_county=[$3], s_state=[$4], c_customer_sk=[$5], c_current_addr_sk=[$6]) - HiveJoin(condition=[=($6, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($1, $3), =($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_county=[$7], ca_state=[$8]) - HiveFilter(condition=[AND(IS NOT NULL($7), IS NOT NULL($8))]) - HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) - HiveProject(s_county=[$23], s_state=[$24]) - HiveFilter(condition=[AND(IS NOT NULL($23), IS NOT NULL($24))]) - HiveTableScan(table=[[default, store]], table:alias=[store]) - HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$1]) - HiveSemiJoin(condition=[=($0, $2)], joinType=[semi]) - HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$4]) - HiveFilter(condition=[IS NOT NULL($4)]) - HiveTableScan(table=[[default, customer]], table:alias=[customer]) - HiveProject(customer_sk=[$1]) - HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($0, $3)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(sold_date_sk=[$0], customer_sk=[$1], item_sk=[$2]) - HiveUnion(all=[true]) - HiveProject(sold_date_sk=[$33], customer_sk=[$2], item_sk=[$14]) - HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($33))]) - HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(sold_date_sk=[$33], customer_sk=[$3], item_sk=[$2]) - HiveFilter(condition=[AND(IS NOT NULL($3), IS NOT NULL($33))]) - HiveTableScan(table=[[default, web_sales]], table:alias=[web_sales]) - HiveProject(d_date_sk=[$0]) + HiveProject($f0=[+($3, 3)]) HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(i_item_sk=[$0]) - HiveFilter(condition=[AND(=($10, _UTF-16LE'consignment '), =($12, _UTF-16LE'Jewelry '))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(d_date_sk=[$0], d_month_seq=[$1], $f0=[$2], $f00=[$3]) - HiveJoin(condition=[<=($1, $3)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[<=($2, $1)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(d_date_sk=[$0], d_month_seq=[$3]) - HiveFilter(condition=[IS NOT NULL($3)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject($f0=[$0]) - HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 1)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject($f0=[$0]) - HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 3)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) + HiveProject(d_date_sk=[$0], d_month_seq=[$1], $f0=[$2], $f00=[$3], cnt=[$4]) + HiveJoin(condition=[<=($1, $3)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[<=($2, $1)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(d_date_sk=[$0], d_month_seq=[$3]) + HiveFilter(condition=[IS NOT NULL($3)]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject($f0=[$0]) + HiveAggregate(group=[{0}]) + HiveProject($f0=[+($3, 1)]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject($f0=[$0], cnt=[$1]) + HiveJoin(condition=[true], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject($f0=[$0]) + HiveAggregate(group=[{0}]) + HiveProject($f0=[+($3, 3)]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(cnt=[$0]) + HiveFilter(condition=[sq_count_check($0)]) + HiveProject(cnt=[$0]) + HiveAggregate(group=[{}], cnt=[COUNT()]) + HiveProject($f0=[$0]) + HiveAggregate(group=[{0}]) + HiveProject($f0=[+($3, 1)]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(ca_address_sk=[$0], ca_county=[$1], ca_state=[$2], s_county=[$3], s_state=[$4], c_customer_sk=[$5], c_current_addr_sk=[$6]) + HiveJoin(condition=[=($6, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($1, $3), =($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(ca_address_sk=[$0], ca_county=[$7], ca_state=[$8]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($7))]) + HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) + HiveProject(s_county=[$23], s_state=[$24]) + HiveFilter(condition=[AND(IS NOT NULL($24), IS NOT NULL($23))]) + HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$1]) + HiveSemiJoin(condition=[=($0, $2)], joinType=[semi]) + HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$4]) + HiveFilter(condition=[IS NOT NULL($4)]) + HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveProject(customer_sk=[$1]) + HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($0, $3)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(sold_date_sk=[$0], customer_sk=[$1], item_sk=[$2]) + HiveUnion(all=[true]) + HiveProject(sold_date_sk=[$33], customer_sk=[$2], item_sk=[$14]) + HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($33))]) + HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) + HiveProject(sold_date_sk=[$33], customer_sk=[$3], item_sk=[$2]) + HiveFilter(condition=[AND(IS NOT NULL($3), IS NOT NULL($33))]) + HiveTableScan(table=[[default, web_sales]], table:alias=[web_sales]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(i_item_sk=[$0]) + HiveFilter(condition=[AND(=($10, _UTF-16LE'consignment '), =($12, _UTF-16LE'Jewelry '))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query57.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query57.q.out index 809bc99496f5..eaf43e815401 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query57.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query57.q.out @@ -1,7 +1,7 @@ CTE Suggestion: -HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) +HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($33), IS NOT NULL($10))]) @@ -9,19 +9,19 @@ HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) CTE Suggestion: HiveFilter(condition=[IS NOT NULL($4)]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($33), IS NOT NULL($10))]) @@ -29,12 +29,12 @@ HiveFilter(condition=[IS NOT NULL($4)]) HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) CBO PLAN: HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_sales=[$4], sum_sales=[$5], psum=[$6], nsum=[$7]) @@ -43,11 +43,11 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveJoin(condition=[AND(=($10, $0), =($11, $1), =($12, $2), =($17, $4))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$3], EXPR$0=[-($4, 1)]) HiveFilter(condition=[IS NOT NULL($4)]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveProject(d_year=[$0], d_moy=[$1], cc_name=[$2], i_brand=[$3], i_category=[$4], $f5=[$5]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveProject(d_year=[$0], d_moy=[$1], i_brand=[$2], i_category=[$3], cc_name=[$4], $f5=[$5]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($10), IS NOT NULL($33))]) @@ -55,20 +55,20 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) HiveJoin(condition=[AND(=($5, $0), =($6, $1), =($7, $2), =($12, $4))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$3], EXPR$0=[+($4, 1)]) HiveFilter(condition=[IS NOT NULL($4)]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveProject(d_year=[$0], d_moy=[$1], cc_name=[$2], i_brand=[$3], i_category=[$4], $f5=[$5]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveProject(d_year=[$0], d_moy=[$1], i_brand=[$2], i_category=[$3], cc_name=[$4], $f5=[$5]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($10), IS NOT NULL($33))]) @@ -76,19 +76,19 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col cc_name)=[$2], (tok_table_or_col d_year)=[$3], (tok_table_or_col d_moy)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], avg_window_0=[$6], rank_window_1=[$7]) HiveFilter(condition=[AND(=($3, 2000), >($6, 0:DECIMAL(1, 0)), CASE(>($6, 0:DECIMAL(1, 0)), >(/(ABS(-($5, $6)), $6), 0.1:DECIMAL(1, 1)), false), IS NOT NULL($7))]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_table_or_col d_year)=[$0], (tok_table_or_col d_moy)=[$1], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], avg_window_0=[avg($5) OVER (PARTITION BY $4, $3, $2, $0 ORDER BY $4 NULLS FIRST, $3 NULLS FIRST, $2 NULLS FIRST, $0 NULLS FIRST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveProject(d_year=[$0], d_moy=[$1], cc_name=[$2], i_brand=[$3], i_category=[$4], $f5=[$5]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_table_or_col d_year)=[$0], (tok_table_or_col d_moy)=[$1], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], avg_window_0=[avg($5) OVER (PARTITION BY $3, $2, $4, $0 ORDER BY $3 NULLS FIRST, $2 NULLS FIRST, $4 NULLS FIRST, $0 NULLS FIRST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveProject(d_year=[$0], d_moy=[$1], i_brand=[$2], i_category=[$3], cc_name=[$4], $f5=[$5]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($10), IS NOT NULL($33))]) @@ -96,10 +96,10 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query63.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query63.q.out index 5d881de389d6..ad91e1502da0 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query63.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query63.q.out @@ -11,7 +11,7 @@ HiveSortLimit(sort0=[$0], sort1=[$2], sort2=[$1], dir0=[ASC], dir1=[ASC], dir2=[ HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($22))]) HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) HiveProject(i_item_sk=[$0], i_manager_id=[$20]) - HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) + HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveProject(d_date_sk=[$0], d_moy=[$8]) HiveFilter(condition=[IN($3, 1212, 1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223)]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query64.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query64.q.out index 7b2e0ee6e4bd..20cef665d6b7 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query64.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query64.q.out @@ -44,23 +44,21 @@ HiveProject(product_name=[$0], store_name=[$1], store_zip=[$2], b_street_number= HiveJoin(condition=[AND(=($8, $0), <=($3, $19), =($9, $1), =($10, $2))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject($f1=[$0], $f2=[$1], $f3=[$2], $f15=[$13], $f16=[$14], $f17=[$15], $f18=[$16]) HiveFilter(condition=[IS NOT NULL($13)]) - HiveProject(i_item_sk=[$4], s_store_name=[$5], s_zip=[$6], ca_street_number=[$0], ca_street_name=[$1], ca_city=[$2], ca_zip=[$3], ca_street_number0=[$9], ca_street_name0=[$10], ca_city0=[$11], ca_zip0=[$12], d_year=[$7], d_year0=[$8], $f13=[$13], $f14=[$14], $f15=[$15], $f16=[$16]) - HiveAggregate(group=[{3, 4, 5, 6, 24, 29, 30, 34, 36, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($20)], agg#2=[sum($21)], agg#3=[sum($22)]) - HiveJoin(condition=[=($10, $41)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($8, $39), <>($38, $40))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($15, $37)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($11, $35)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($12, $33)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($9, $32)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($16, $31)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($18, $28)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($13, $0), =($19, $1))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_item_sk=[$0], s_store_name=[$1], s_zip=[$2], ca_street_number=[$5], ca_street_name=[$6], ca_city=[$7], ca_zip=[$8], ca_street_number0=[$9], ca_street_name0=[$10], ca_city0=[$11], ca_zip0=[$12], d_year=[$3], d_year0=[$4], $f13=[$13], $f14=[$14], $f15=[$15], $f16=[$16]) + HiveAggregate(group=[{19, 23, 24, 29, 31, 37, 38, 39, 40, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($15)], agg#2=[sum($16)], agg#3=[sum($17)]) + HiveJoin(condition=[=($5, $41)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($12, $36)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($3, $34), <>($33, $35))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($10, $32)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $30)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $28)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($4, $27)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $26)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($8, $0), =($14, $1))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(sr_item_sk=[$1], sr_ticket_number=[$8]) HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) - HiveJoin(condition=[=($15, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) - HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) - HiveJoin(condition=[=($6, $20)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $23)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $20)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(c_customer_sk=[$0], c_current_cdemo_sk=[$2], c_current_hdemo_sk=[$3], c_current_addr_sk=[$4], c_first_shipto_date_sk=[$5], c_first_sales_date_sk=[$6]) HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($6), IS NOT NULL($3), IS NOT NULL($2), IS NOT NULL($4))]) @@ -76,52 +74,52 @@ HiveProject(product_name=[$0], store_name=[$1], store_zip=[$2], b_street_number= HiveProject(d_date_sk=[$0]) HiveFilter(condition=[=($6, 2001)]) HiveTableScan(table=[[default, date_dim]], table:alias=[d1]) - HiveProject(cs_item_sk=[$0]) - HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) - HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) - HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) - HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) - HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) - HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($25))]) - HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) + HiveFilter(condition=[AND(IS NOT NULL($25), IS NOT NULL($5))]) + HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(cs_item_sk=[$0]) + HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) + HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) + HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) + HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) + HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) + HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) + HiveProject(hd_demo_sk=[$0]) + HiveFilter(condition=[IS NOT NULL($1)]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) HiveProject(hd_demo_sk=[$0]) HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) - HiveProject(hd_demo_sk=[$0]) - HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveProject(d_date_sk=[$0], d_year=[$6]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) - HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) - HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) + HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) HiveTableScan(table=[[default, customer_address]], table:alias=[ad2]) HiveProject($f0=[$0], $f1=[$1], $f2=[$2], $f3=[$3], $f4=[$4], $f5=[$5], $f6=[$6], $f7=[$7], $f8=[$8], $f9=[$9], $f10=[$10], $f11=[$11], $f15=[$14], $f16=[$15], $f17=[$16], $f18=[$17]) HiveFilter(condition=[IS NOT NULL($14)]) - HiveProject(i_product_name=[$5], i_item_sk=[$4], s_store_name=[$6], s_zip=[$7], ca_street_number=[$0], ca_street_name=[$1], ca_city=[$2], ca_zip=[$3], ca_street_number0=[$10], ca_street_name0=[$11], ca_city0=[$12], ca_zip0=[$13], d_year=[$8], d_year0=[$9], $f14=[$14], $f15=[$15], $f16=[$16], $f17=[$17]) - HiveAggregate(group=[{3, 4, 5, 6, 24, 25, 29, 30, 34, 36, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($20)], agg#2=[sum($21)], agg#3=[sum($22)]) - HiveJoin(condition=[=($10, $41)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($8, $39), <>($38, $40))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($15, $37)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($11, $35)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($12, $33)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($9, $32)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($16, $31)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($18, $28)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($13, $0), =($19, $1))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_product_name=[$1], i_item_sk=[$0], s_store_name=[$2], s_zip=[$3], ca_street_number=[$6], ca_street_name=[$7], ca_city=[$8], ca_zip=[$9], ca_street_number0=[$10], ca_street_name0=[$11], ca_city0=[$12], ca_zip0=[$13], d_year=[$4], d_year0=[$5], $f14=[$14], $f15=[$15], $f16=[$16], $f17=[$17]) + HiveAggregate(group=[{19, 20, 23, 24, 29, 31, 37, 38, 39, 40, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($15)], agg#2=[sum($16)], agg#3=[sum($17)]) + HiveJoin(condition=[=($5, $41)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($12, $36)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($3, $34), <>($33, $35))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($10, $32)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $30)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $28)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($4, $27)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $26)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($8, $0), =($14, $1))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(sr_item_sk=[$1], sr_ticket_number=[$8]) HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) - HiveJoin(condition=[=($15, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) - HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) - HiveJoin(condition=[=($6, $20)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $23)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $20)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(c_customer_sk=[$0], c_current_cdemo_sk=[$2], c_current_hdemo_sk=[$3], c_current_addr_sk=[$4], c_first_shipto_date_sk=[$5], c_first_sales_date_sk=[$6]) HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($6), IS NOT NULL($3), IS NOT NULL($2), IS NOT NULL($4))]) @@ -137,31 +135,33 @@ HiveProject(product_name=[$0], store_name=[$1], store_zip=[$2], b_street_number= HiveProject(d_date_sk=[$0]) HiveFilter(condition=[=($6, 2000)]) HiveTableScan(table=[[default, date_dim]], table:alias=[d1]) - HiveProject(cs_item_sk=[$0]) - HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) - HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) - HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) - HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) - HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) - HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($25))]) - HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) + HiveFilter(condition=[AND(IS NOT NULL($25), IS NOT NULL($5))]) + HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(cs_item_sk=[$0]) + HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) + HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) + HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) + HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) + HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) + HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) + HiveProject(hd_demo_sk=[$0]) + HiveFilter(condition=[IS NOT NULL($1)]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) HiveProject(hd_demo_sk=[$0]) HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) - HiveProject(hd_demo_sk=[$0]) - HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveProject(d_date_sk=[$0], d_year=[$6]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) - HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) - HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) + HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) HiveTableScan(table=[[default, customer_address]], table:alias=[ad2]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query7.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query7.q.out index 5c5d16b51077..2cef673adc7d 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query7.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query7.q.out @@ -1,23 +1,23 @@ CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(i_item_id=[$0], agg1=[/(CAST($1):DOUBLE, $2)], agg2=[CAST(/($3, $4)):DECIMAL(11, 6)], agg3=[CAST(/($5, $6)):DECIMAL(11, 6)], agg4=[CAST(/($7, $8)):DECIMAL(11, 6)]) - HiveAggregate(group=[{12}], agg#0=[sum($3)], agg#1=[count($3)], agg#2=[sum($4)], agg#3=[count($4)], agg#4=[sum($6)], agg#5=[count($6)], agg#6=[sum($5)], agg#7=[count($5)]) - HiveJoin(condition=[=($0, $11)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $10)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $8)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveAggregate(group=[{1}], agg#0=[sum($5)], agg#1=[count($5)], agg#2=[sum($6)], agg#3=[count($6)], agg#4=[sum($8)], agg#5=[count($8)], agg#6=[sum($7)], agg#7=[count($7)]) + HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_item_sk=[$0], i_item_id=[$1]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveJoin(condition=[=($1, $10)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $9)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $8)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(ss_item_sk=[$1], ss_cdemo_sk=[$3], ss_promo_sk=[$7], ss_quantity=[$9], ss_list_price=[$11], ss_sales_price=[$12], ss_coupon_amt=[$18], ss_sold_date_sk=[$22]) HiveFilter(condition=[AND(IS NOT NULL($3), IS NOT NULL($7), IS NOT NULL($22))]) HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[=($6, 1998)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cd_demo_sk=[$0]) - HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(i_item_sk=[$0], i_item_id=[$1]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[=($6, 1998)]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(cd_demo_sk=[$0]) + HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query8.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query8.q.out index 0bf0810023ae..321c390bd531 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query8.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query8.q.out @@ -26,14 +26,14 @@ HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveAggregate(group=[{0}], agg#0=[count()]) HiveProject($f0=[substr($0, 1, 5)]) HiveFilter(condition=[>($1, 10)]) - HiveAggregate(group=[{1}], agg#0=[count()]) - HiveJoin(condition=[=($0, $2)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_zip=[$9]) - HiveFilter(condition=[IS NOT NULL(substr(substr($9, 1, 5), 1, 2))]) - HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) + HiveAggregate(group=[{2}], agg#0=[count()]) + HiveJoin(condition=[=($1, $0)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(c_current_addr_sk=[$4]) HiveFilter(condition=[AND(=($10, _UTF-16LE'Y'), IS NOT NULL($4))]) HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveProject(ca_address_sk=[$0], ca_zip=[$9]) + HiveFilter(condition=[IS NOT NULL(substr(substr($9, 1, 5), 1, 2))]) + HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) HiveProject(s_store_sk=[$0], s_store_name=[$5], EXPR$0=[substr($25, 1, 2)]) HiveFilter(condition=[IS NOT NULL(substr($25, 1, 2))]) HiveTableScan(table=[[default, store]], table:alias=[store]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query80.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query80.q.out index f8676ae03592..8c295ec9b763 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query80.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query80.q.out @@ -23,8 +23,8 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveAggregate(group=[{0}], agg#0=[sum($1)], agg#1=[sum($2)], agg#2=[sum($3)]) HiveProject($f0=[$15], $f1=[$4], $f2=[CASE(IS NOT NULL($9), $9, 0:DECIMAL(12, 2))], $f3=[-($5, CASE(IS NOT NULL($10), $10, 0:DECIMAL(12, 2)))]) HiveJoin(condition=[=($1, $14)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($6, $13)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $13)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $12)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($0, $11)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[AND(=($0, $7), =($3, $8))], joinType=[left], algorithm=[none], cost=[not available]) HiveProject(ss_item_sk=[$1], ss_store_sk=[$6], ss_promo_sk=[$7], ss_ticket_number=[$8], ss_ext_sales_price=[$14], ss_net_profit=[$21], ss_sold_date_sk=[$22]) @@ -35,20 +35,20 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(i_item_sk=[$0]) HiveFilter(condition=[>($5, 50:DECIMAL(2, 0))]) HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[=($11, _UTF-16LE'N')]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[=($11, _UTF-16LE'N')]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) HiveProject(s_store_sk=[$0], s_store_id=[$1]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(channel=[_UTF-16LE'catalog channel':VARCHAR(2147483647) CHARACTER SET "UTF-16LE"], id=[||(_UTF-16LE'catalog_page':VARCHAR(2147483647) CHARACTER SET "UTF-16LE", $0)], sales=[$1], returns=[$2], profit=[$3]) HiveAggregate(group=[{0}], agg#0=[sum($1)], agg#1=[sum($2)], agg#2=[sum($3)]) HiveProject($f0=[$15], $f1=[$4], $f2=[CASE(IS NOT NULL($9), $9, 0:DECIMAL(12, 2))], $f3=[-($5, CASE(IS NOT NULL($10), $10, 0:DECIMAL(12, 2)))]) HiveJoin(condition=[=($0, $14)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($6, $13)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $13)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $12)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($1, $11)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[AND(=($1, $7), =($3, $8))], joinType=[left], algorithm=[none], cost=[not available]) HiveProject(cs_catalog_page_sk=[$11], cs_item_sk=[$14], cs_promo_sk=[$15], cs_order_number=[$16], cs_ext_sales_price=[$22], cs_net_profit=[$32], cs_sold_date_sk=[$33]) @@ -59,20 +59,20 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(i_item_sk=[$0]) HiveFilter(condition=[>($5, 50:DECIMAL(2, 0))]) HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[=($11, _UTF-16LE'N')]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[=($11, _UTF-16LE'N')]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) HiveProject(cp_catalog_page_sk=[$0], cp_catalog_page_id=[$1]) HiveTableScan(table=[[default, catalog_page]], table:alias=[catalog_page]) HiveProject(channel=[_UTF-16LE'web channel':VARCHAR(2147483647) CHARACTER SET "UTF-16LE"], id=[||(_UTF-16LE'web_site':VARCHAR(2147483647) CHARACTER SET "UTF-16LE", $0)], sales=[$1], returns=[$2], profit=[$3]) HiveAggregate(group=[{0}], agg#0=[sum($1)], agg#1=[sum($2)], agg#2=[sum($3)]) HiveProject($f0=[$15], $f1=[$4], $f2=[CASE(IS NOT NULL($9), $9, 0:DECIMAL(12, 2))], $f3=[-($5, CASE(IS NOT NULL($10), $10, 0:DECIMAL(12, 2)))]) HiveJoin(condition=[=($1, $14)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($6, $13)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $13)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $12)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($0, $11)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[AND(=($0, $7), =($3, $8))], joinType=[left], algorithm=[none], cost=[not available]) HiveProject(ws_item_sk=[$2], ws_web_site_sk=[$12], ws_promo_sk=[$15], ws_order_number=[$16], ws_ext_sales_price=[$22], ws_net_profit=[$32], ws_sold_date_sk=[$33]) @@ -83,12 +83,12 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(i_item_sk=[$0]) HiveFilter(condition=[>($5, 50:DECIMAL(2, 0))]) HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[=($11, _UTF-16LE'N')]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[=($11, _UTF-16LE'N')]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) HiveProject(web_site_sk=[$0], web_site_id=[$1]) HiveTableScan(table=[[default, web_site]], table:alias=[web_site]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query96.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query96.q.out index c5293dfc7d11..410434109319 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query96.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/cte/cbo_query96.q.out @@ -1,7 +1,7 @@ CBO PLAN: HiveAggregate(group=[{}], agg#0=[count()]) - HiveJoin(condition=[=($1, $5)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $5)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($0, $3)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(ss_sold_time_sk=[$0], ss_hdemo_sk=[$4], ss_store_sk=[$6]) HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($4), IS NOT NULL($0))]) @@ -9,10 +9,10 @@ HiveAggregate(group=[{}], agg#0=[count()]) HiveProject(t_time_sk=[$0]) HiveFilter(condition=[AND(=($3, 8), >=($4, 30))]) HiveTableScan(table=[[default, time_dim]], table:alias=[time_dim]) - HiveProject(s_store_sk=[$0]) - HiveFilter(condition=[=($5, _UTF-16LE'ese')]) - HiveTableScan(table=[[default, store]], table:alias=[store]) - HiveProject(hd_demo_sk=[$0]) - HiveFilter(condition=[=($3, 5)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[household_demographics]) + HiveProject(hd_demo_sk=[$0]) + HiveFilter(condition=[=($3, 5)]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[household_demographics]) + HiveProject(s_store_sk=[$0]) + HiveFilter(condition=[=($5, _UTF-16LE'ese')]) + HiveTableScan(table=[[default, store]], table:alias=[store]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_ext_query1.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_ext_query1.q.out index 5b4b7d14c27a..6c5d7a2d38b6 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_ext_query1.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_ext_query1.q.out @@ -1,10 +1,10 @@ CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveProject(c_customer_id=[$1]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[AND(=($3, $7), >($4, $6))], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(c_customer_sk=[$0], c_customer_id=[$1]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveTableScan(table=[[default, customer]], table:alias=[customer]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(c_customer_sk=[$0], c_customer_id=[$1]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveTableScan(table=[[default, customer]], table:alias=[customer]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[AND(=($1, $5), >($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveJoin(condition=[=($3, $1)], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveFilter(condition=[IS NOT NULL($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### @@ -19,27 +19,27 @@ HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]): rowcount = ###Masked###, cum HiveProject(s_store_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveFilter(condition=[=($24, _UTF-16LE'NM')]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveTableScan(table=[[default, store]], table:alias=[store]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(d_date_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveFilter(condition=[=($6, 2000)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(d_date_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveFilter(condition=[=($6, 2000)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveProject(c_customer_id=[$1]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[AND(=($3, $7), >($4, $6))], joinType=[inner], algorithm=[none], cost=[{13.140068448808671 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[{8.000001214006844E7 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(c_customer_sk=[$0], c_customer_id=[$1]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveTableScan(table=[[default, customer]], table:alias=[customer]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[=($3, $1)], joinType=[inner], algorithm=[none], cost=[{572.8902844748543 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[{8.0000001E7 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(c_customer_sk=[$0], c_customer_id=[$1]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveTableScan(table=[[default, customer]], table:alias=[customer]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[AND(=($1, $5), >($2, $4))], joinType=[inner], algorithm=[none], cost=[{13.42239562203678 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[=($3, $1)], joinType=[inner], algorithm=[none], cost=[{573.7909187243257 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveFilter(condition=[IS NOT NULL($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### @@ -53,16 +53,16 @@ HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]): rowcount = ###Masked###, cum HiveProject(s_store_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveFilter(condition=[=($24, _UTF-16LE'NM')]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### HiveTableScan(table=[[default, store]], table:alias=[store]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[{8.180936341080402E9 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveProject(d_date_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveFilter(condition=[=($6, 2000)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[{8.180936341080402E9 rows, 0.0 cpu, 0.0 io}]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveProject(d_date_sk=[$0]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveFilter(condition=[=($6, 2000)]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]): rowcount = ###Masked###, cumulative cost = ###Masked###, id = ###Masked### diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query1.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query1.q.out index 1216481c7623..88ff9b49f746 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query1.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query1.q.out @@ -1,10 +1,10 @@ CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(c_customer_id=[$1]) - HiveJoin(condition=[AND(=($3, $7), >($4, $6))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(c_customer_sk=[$0], c_customer_id=[$1]) - HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(c_customer_sk=[$0], c_customer_id=[$1]) + HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveJoin(condition=[AND(=($1, $5), >($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $1)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]) HiveFilter(condition=[IS NOT NULL($2)]) @@ -19,16 +19,16 @@ HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(s_store_sk=[$0]) HiveFilter(condition=[=($24, _UTF-16LE'NM')]) HiveTableScan(table=[[default, store]], table:alias=[store]) - HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]) - HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]) - HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]) - HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]) - HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]) - HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]) - HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]) - HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[=($6, 2000)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(_o__c0=[*(CAST(/($1, $2)):DECIMAL(21, 6), 1.2:DECIMAL(2, 1))], ctr_store_sk=[$0]) + HiveFilter(condition=[IS NOT NULL(CAST(/($1, $2)):DECIMAL(21, 6))]) + HiveAggregate(group=[{1}], agg#0=[sum($2)], agg#1=[count($2)]) + HiveProject(sr_customer_sk=[$0], sr_store_sk=[$1], $f2=[$2]) + HiveAggregate(group=[{0, 1}], agg#0=[sum($2)]) + HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(sr_customer_sk=[$2], sr_store_sk=[$6], sr_fee=[$13], sr_returned_date_sk=[$19]) + HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($19))]) + HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[=($6, 2000)]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query26.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query26.q.out index dda45cc67163..f8d40531b0e6 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query26.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query26.q.out @@ -1,23 +1,23 @@ CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(i_item_id=[$0], agg1=[/(CAST($1):DOUBLE, $2)], agg2=[CAST(/($3, $4)):DECIMAL(11, 6)], agg3=[CAST(/($5, $6)):DECIMAL(11, 6)], agg4=[CAST(/($7, $8)):DECIMAL(11, 6)]) - HiveAggregate(group=[{12}], agg#0=[sum($3)], agg#1=[count($3)], agg#2=[sum($4)], agg#3=[count($4)], agg#4=[sum($6)], agg#5=[count($6)], agg#6=[sum($5)], agg#7=[count($5)]) - HiveJoin(condition=[=($1, $11)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $10)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($0, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $8)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveAggregate(group=[{1}], agg#0=[sum($5)], agg#1=[count($5)], agg#2=[sum($6)], agg#3=[count($6)], agg#4=[sum($8)], agg#5=[count($8)], agg#6=[sum($7)], agg#7=[count($7)]) + HiveJoin(condition=[=($3, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_item_sk=[$0], i_item_id=[$1]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveJoin(condition=[=($0, $10)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $9)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $8)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_bill_cdemo_sk=[$3], cs_item_sk=[$14], cs_promo_sk=[$15], cs_quantity=[$17], cs_list_price=[$19], cs_sales_price=[$20], cs_coupon_amt=[$26], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($15), IS NOT NULL($3), IS NOT NULL($33))]) HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[=($6, 1998)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cd_demo_sk=[$0]) - HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(i_item_sk=[$0], i_item_id=[$1]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[=($6, 1998)]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(cd_demo_sk=[$0]) + HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query47.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query47.q.out index c174e1bbd06e..d5c9a401fa59 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query47.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query47.q.out @@ -18,10 +18,10 @@ HiveProject(i_category=[$0], d_year=[$1], d_moy=[$2], avg_monthly_sales=[$3], su HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) HiveProject(s_store_sk=[$0], s_store_name=[$5], s_company_name=[$17]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($17))]) + HiveFilter(condition=[AND(IS NOT NULL($17), IS NOT NULL($5))]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveJoin(condition=[AND(=($6, $0), =($7, $1), =($8, $2), =($9, $3), =($14, $5))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col s_store_name)=[$2], (tok_table_or_col s_company_name)=[$3], (tok_function sum (tok_table_or_col ss_sales_price))=[$4], EXPR$0=[+($5, 1)]) @@ -39,10 +39,10 @@ HiveProject(i_category=[$0], d_year=[$1], d_moy=[$2], avg_monthly_sales=[$3], su HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) HiveProject(s_store_sk=[$0], s_store_name=[$5], s_company_name=[$17]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($17))]) + HiveFilter(condition=[AND(IS NOT NULL($17), IS NOT NULL($5))]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col s_store_name)=[$2], (tok_table_or_col s_company_name)=[$3], (tok_table_or_col d_year)=[$4], (tok_table_or_col d_moy)=[$5], (tok_function sum (tok_table_or_col ss_sales_price))=[$6], avg_window_0=[$7], rank_window_1=[$8]) HiveFilter(condition=[AND(=($4, 2000), >($7, 0:DECIMAL(1, 0)), CASE(>($7, 0:DECIMAL(1, 0)), >(/(ABS(-($6, $7)), $7), 0.1:DECIMAL(1, 1)), false), IS NOT NULL($8))]) @@ -59,9 +59,9 @@ HiveProject(i_category=[$0], d_year=[$1], d_moy=[$2], avg_monthly_sales=[$3], su HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) HiveProject(s_store_sk=[$0], s_store_name=[$5], s_company_name=[$17]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($17))]) + HiveFilter(condition=[AND(IS NOT NULL($17), IS NOT NULL($5))]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) HiveTableScan(table=[[default, item]], table:alias=[item]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query53.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query53.q.out index 07fa3e1c3c13..d479f73cc927 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query53.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query53.q.out @@ -11,7 +11,7 @@ HiveSortLimit(sort0=[$2], sort1=[$1], sort2=[$0], dir0=[ASC], dir1=[ASC], dir2=[ HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($22))]) HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) HiveProject(i_item_sk=[$0], i_manufact_id=[$13]) - HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) + HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'reference', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveProject(d_date_sk=[$0], d_qoy=[$10]) HiveFilter(condition=[IN($3, 1212, 1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223)]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query54.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query54.q.out index 1feeb5e1d87c..645c57f6e945 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query54.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query54.q.out @@ -1,83 +1,84 @@ -Warning: Map Join MAPJOIN[294][bigTable=?] in task 'Map 21' is a cross product -Warning: Map Join MAPJOIN[291][bigTable=?] in task 'Map 21' is a cross product -Warning: Map Join MAPJOIN[292][bigTable=?] in task 'Map 1' is a cross product -Warning: Map Join MAPJOIN[286][bigTable=?] in task 'Map 1' is a cross product +Warning: Map Join MAPJOIN[289][bigTable=?] in task 'Reducer 12' is a cross product +Warning: Map Join MAPJOIN[290][bigTable=?] in task 'Map 5' is a cross product +Warning: Map Join MAPJOIN[284][bigTable=?] in task 'Map 5' is a cross product +Warning: Map Join MAPJOIN[283][bigTable=?] in task 'Map 1' is a cross product CBO PLAN: HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(segment=[$0], num_customers=[$1], segment_base=[*($0, 50)]) HiveAggregate(group=[{0}], agg#0=[count()]) HiveProject($f0=[CAST(/($1, 50:DECIMAL(10, 0))):INTEGER]) - HiveAggregate(group=[{10}], agg#0=[sum($1)]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveAggregate(group=[{14}], agg#0=[sum($1)]) + HiveJoin(condition=[=($14, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[true], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[true], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ss_customer_sk=[$2], ss_ext_sales_price=[$14], ss_sold_date_sk=[$22]) - HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($22))]) - HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) - HiveProject(cnt=[$0]) - HiveFilter(condition=[sq_count_check($0)]) - HiveProject(cnt=[$0]) - HiveAggregate(group=[{}], cnt=[COUNT()]) - HiveProject($f0=[$0]) - HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 3)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(ss_customer_sk=[$2], ss_ext_sales_price=[$14], ss_sold_date_sk=[$22]) + HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($22))]) + HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) HiveProject(cnt=[$0]) HiveFilter(condition=[sq_count_check($0)]) HiveProject(cnt=[$0]) HiveAggregate(group=[{}], cnt=[COUNT()]) HiveProject($f0=[$0]) HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 1)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(ca_address_sk=[$0], ca_county=[$1], ca_state=[$2], s_county=[$3], s_state=[$4], c_customer_sk=[$5], c_current_addr_sk=[$6]) - HiveJoin(condition=[=($6, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($1, $3), =($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_county=[$7], ca_state=[$8]) - HiveFilter(condition=[AND(IS NOT NULL($7), IS NOT NULL($8))]) - HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) - HiveProject(s_county=[$23], s_state=[$24]) - HiveFilter(condition=[AND(IS NOT NULL($23), IS NOT NULL($24))]) - HiveTableScan(table=[[default, store]], table:alias=[store]) - HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$1]) - HiveSemiJoin(condition=[=($0, $2)], joinType=[semi]) - HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$4]) - HiveFilter(condition=[IS NOT NULL($4)]) - HiveTableScan(table=[[default, customer]], table:alias=[customer]) - HiveProject(customer_sk=[$1]) - HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($0, $3)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(sold_date_sk=[$0], customer_sk=[$1], item_sk=[$2]) - HiveUnion(all=[true]) - HiveProject(sold_date_sk=[$33], customer_sk=[$2], item_sk=[$14]) - HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($33))]) - HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(sold_date_sk=[$33], customer_sk=[$3], item_sk=[$2]) - HiveFilter(condition=[AND(IS NOT NULL($3), IS NOT NULL($33))]) - HiveTableScan(table=[[default, web_sales]], table:alias=[web_sales]) - HiveProject(d_date_sk=[$0]) + HiveProject($f0=[+($3, 3)]) HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(i_item_sk=[$0]) - HiveFilter(condition=[AND(=($10, _UTF-16LE'consignment '), =($12, _UTF-16LE'Jewelry '))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(d_date_sk=[$0], d_month_seq=[$1], $f0=[$2], $f00=[$3]) - HiveJoin(condition=[<=($1, $3)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[<=($2, $1)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(d_date_sk=[$0], d_month_seq=[$3]) - HiveFilter(condition=[IS NOT NULL($3)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject($f0=[$0]) - HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 1)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject($f0=[$0]) - HiveAggregate(group=[{0}]) - HiveProject($f0=[+($3, 3)]) - HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) + HiveProject(d_date_sk=[$0], d_month_seq=[$1], $f0=[$2], $f00=[$3], cnt=[$4]) + HiveJoin(condition=[<=($1, $3)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[<=($2, $1)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(d_date_sk=[$0], d_month_seq=[$3]) + HiveFilter(condition=[IS NOT NULL($3)]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject($f0=[$0]) + HiveAggregate(group=[{0}]) + HiveProject($f0=[+($3, 1)]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject($f0=[$0], cnt=[$1]) + HiveJoin(condition=[true], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject($f0=[$0]) + HiveAggregate(group=[{0}]) + HiveProject($f0=[+($3, 3)]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3), IS NOT NULL($3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(cnt=[$0]) + HiveFilter(condition=[sq_count_check($0)]) + HiveProject(cnt=[$0]) + HiveAggregate(group=[{}], cnt=[COUNT()]) + HiveProject($f0=[$0]) + HiveAggregate(group=[{0}]) + HiveProject($f0=[+($3, 1)]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(ca_address_sk=[$0], ca_county=[$1], ca_state=[$2], s_county=[$3], s_state=[$4], c_customer_sk=[$5], c_current_addr_sk=[$6]) + HiveJoin(condition=[=($6, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($1, $3), =($2, $4))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(ca_address_sk=[$0], ca_county=[$7], ca_state=[$8]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($7))]) + HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) + HiveProject(s_county=[$23], s_state=[$24]) + HiveFilter(condition=[AND(IS NOT NULL($24), IS NOT NULL($23))]) + HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$1]) + HiveSemiJoin(condition=[=($0, $2)], joinType=[semi]) + HiveProject(c_customer_sk=[$0], c_current_addr_sk=[$4]) + HiveFilter(condition=[IS NOT NULL($4)]) + HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveProject(customer_sk=[$1]) + HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($0, $3)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(sold_date_sk=[$0], customer_sk=[$1], item_sk=[$2]) + HiveUnion(all=[true]) + HiveProject(sold_date_sk=[$33], customer_sk=[$2], item_sk=[$14]) + HiveFilter(condition=[AND(IS NOT NULL($2), IS NOT NULL($33))]) + HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) + HiveProject(sold_date_sk=[$33], customer_sk=[$3], item_sk=[$2]) + HiveFilter(condition=[AND(IS NOT NULL($3), IS NOT NULL($33))]) + HiveTableScan(table=[[default, web_sales]], table:alias=[web_sales]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[AND(=($6, 1999), =($8, 3))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(i_item_sk=[$0]) + HiveFilter(condition=[AND(=($10, _UTF-16LE'consignment '), =($12, _UTF-16LE'Jewelry '))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query57.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query57.q.out index f2a671fa06b4..6fecf4eeff2e 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query57.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query57.q.out @@ -5,11 +5,11 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveJoin(condition=[AND(=($10, $0), =($11, $1), =($12, $2), =($17, $4))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$3], EXPR$0=[-($4, 1)]) HiveFilter(condition=[IS NOT NULL($4)]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveProject(d_year=[$0], d_moy=[$1], cc_name=[$2], i_brand=[$3], i_category=[$4], $f5=[$5]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveProject(d_year=[$0], d_moy=[$1], i_brand=[$2], i_category=[$3], cc_name=[$4], $f5=[$5]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($10), IS NOT NULL($33))]) @@ -17,20 +17,20 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) HiveJoin(condition=[AND(=($5, $0), =($6, $1), =($7, $2), =($12, $4))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$3], EXPR$0=[+($4, 1)]) HiveFilter(condition=[IS NOT NULL($4)]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveProject(d_year=[$0], d_moy=[$1], cc_name=[$2], i_brand=[$3], i_category=[$4], $f5=[$5]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveProject(d_year=[$0], d_moy=[$1], i_brand=[$2], i_category=[$3], cc_name=[$4], $f5=[$5]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($10), IS NOT NULL($33))]) @@ -38,19 +38,19 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) HiveProject((tok_table_or_col i_category)=[$0], (tok_table_or_col i_brand)=[$1], (tok_table_or_col cc_name)=[$2], (tok_table_or_col d_year)=[$3], (tok_table_or_col d_moy)=[$4], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], avg_window_0=[$6], rank_window_1=[$7]) HiveFilter(condition=[AND(=($3, 2000), >($6, 0:DECIMAL(1, 0)), CASE(>($6, 0:DECIMAL(1, 0)), >(/(ABS(-($5, $6)), $6), 0.1:DECIMAL(1, 1)), false), IS NOT NULL($7))]) - HiveProject((tok_table_or_col i_category)=[$4], (tok_table_or_col i_brand)=[$3], (tok_table_or_col cc_name)=[$2], (tok_table_or_col d_year)=[$0], (tok_table_or_col d_moy)=[$1], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], avg_window_0=[avg($5) OVER (PARTITION BY $4, $3, $2, $0 ORDER BY $4 NULLS FIRST, $3 NULLS FIRST, $2 NULLS FIRST, $0 NULLS FIRST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)], rank_window_1=[rank() OVER (PARTITION BY $4, $3, $2 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) - HiveProject(d_year=[$0], d_moy=[$1], cc_name=[$2], i_brand=[$3], i_category=[$4], $f5=[$5]) - HiveAggregate(group=[{5, 6, 8, 10, 11}], agg#0=[sum($2)]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject((tok_table_or_col i_category)=[$3], (tok_table_or_col i_brand)=[$2], (tok_table_or_col cc_name)=[$4], (tok_table_or_col d_year)=[$0], (tok_table_or_col d_moy)=[$1], (tok_function sum (tok_table_or_col cs_sales_price))=[$5], avg_window_0=[avg($5) OVER (PARTITION BY $3, $2, $4, $0 ORDER BY $3 NULLS FIRST, $2 NULLS FIRST, $4 NULLS FIRST, $0 NULLS FIRST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)], rank_window_1=[rank() OVER (PARTITION BY $3, $2, $4 ORDER BY $0 NULLS LAST, $1 NULLS LAST RANGE BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING)]) + HiveProject(d_year=[$0], d_moy=[$1], i_brand=[$2], i_category=[$3], cc_name=[$4], $f5=[$5]) + HiveAggregate(group=[{5, 6, 8, 9, 11}], agg#0=[sum($2)]) + HiveJoin(condition=[=($10, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $7)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($3, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(cs_call_center_sk=[$10], cs_item_sk=[$14], cs_sales_price=[$20], cs_sold_date_sk=[$33]) HiveFilter(condition=[AND(IS NOT NULL($10), IS NOT NULL($33))]) @@ -58,10 +58,10 @@ HiveProject(i_category=[$0], i_brand=[$1], d_year=[$2], d_moy=[$3], avg_monthly_ HiveProject(d_date_sk=[$0], d_year=[$6], d_moy=[$8]) HiveFilter(condition=[AND(IN($6, 1999, 2000, 2001), OR(=($6, 2000), IN(ROW($6, $8), ROW(1999, 12), ROW(2001, 1))))]) HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) - HiveFilter(condition=[IS NOT NULL($6)]) - HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) - HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) - HiveFilter(condition=[AND(IS NOT NULL($12), IS NOT NULL($8))]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(i_item_sk=[$0], i_brand=[$8], i_category=[$12]) + HiveFilter(condition=[AND(IS NOT NULL($8), IS NOT NULL($12))]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(cc_call_center_sk=[$0], cc_name=[$6]) + HiveFilter(condition=[IS NOT NULL($6)]) + HiveTableScan(table=[[default, call_center]], table:alias=[call_center]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query63.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query63.q.out index 5d881de389d6..ad91e1502da0 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query63.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query63.q.out @@ -11,7 +11,7 @@ HiveSortLimit(sort0=[$0], sort1=[$2], sort2=[$1], dir0=[ASC], dir1=[ASC], dir2=[ HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($22))]) HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) HiveProject(i_item_sk=[$0], i_manager_id=[$20]) - HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) + HiveFilter(condition=[AND(IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants', _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'exportiunivamalg #9', _UTF-16LE'importoamalg #1', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9'), IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics', _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), OR(AND(IN($12, _UTF-16LE'Books', _UTF-16LE'Children', _UTF-16LE'Electronics'), IN($10, _UTF-16LE'personal', _UTF-16LE'portable', _UTF-16LE'refernece', _UTF-16LE'self-help'), IN($8, _UTF-16LE'exportiunivamalg #9', _UTF-16LE'scholaramalgamalg #14', _UTF-16LE'scholaramalgamalg #7', _UTF-16LE'scholaramalgamalg #9')), AND(IN($12, _UTF-16LE'Men', _UTF-16LE'Music', _UTF-16LE'Women'), IN($10, _UTF-16LE'accessories', _UTF-16LE'classical', _UTF-16LE'fragrances', _UTF-16LE'pants'), IN($8, _UTF-16LE'amalgimporto #1', _UTF-16LE'edu packscholar #1', _UTF-16LE'exportiimporto #1', _UTF-16LE'importoamalg #1'))))]) HiveTableScan(table=[[default, item]], table:alias=[item]) HiveProject(d_date_sk=[$0], d_moy=[$8]) HiveFilter(condition=[IN($3, 1212, 1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223)]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query64.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query64.q.out index a0f3693017d2..ab082840d185 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query64.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query64.q.out @@ -5,23 +5,21 @@ HiveProject(product_name=[$0], store_name=[$1], store_zip=[$2], b_street_number= HiveJoin(condition=[AND(=($8, $0), <=($3, $19), =($9, $1), =($10, $2))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject($f1=[$0], $f2=[$1], $f3=[$2], $f15=[$13], $f16=[$14], $f17=[$15], $f18=[$16]) HiveFilter(condition=[IS NOT NULL($13)]) - HiveProject(i_item_sk=[$4], s_store_name=[$5], s_zip=[$6], ca_street_number=[$0], ca_street_name=[$1], ca_city=[$2], ca_zip=[$3], ca_street_number0=[$9], ca_street_name0=[$10], ca_city0=[$11], ca_zip0=[$12], d_year=[$7], d_year0=[$8], $f13=[$13], $f14=[$14], $f15=[$15], $f16=[$16]) - HiveAggregate(group=[{3, 4, 5, 6, 24, 29, 30, 34, 36, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($20)], agg#2=[sum($21)], agg#3=[sum($22)]) - HiveJoin(condition=[=($10, $41)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($8, $39), <>($38, $40))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($15, $37)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($11, $35)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($12, $33)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($9, $32)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($16, $31)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($18, $28)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($13, $0), =($19, $1))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_item_sk=[$0], s_store_name=[$1], s_zip=[$2], ca_street_number=[$5], ca_street_name=[$6], ca_city=[$7], ca_zip=[$8], ca_street_number0=[$9], ca_street_name0=[$10], ca_city0=[$11], ca_zip0=[$12], d_year=[$3], d_year0=[$4], $f13=[$13], $f14=[$14], $f15=[$15], $f16=[$16]) + HiveAggregate(group=[{19, 23, 24, 29, 31, 37, 38, 39, 40, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($15)], agg#2=[sum($16)], agg#3=[sum($17)]) + HiveJoin(condition=[=($5, $41)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($12, $36)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($3, $34), <>($33, $35))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($10, $32)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $30)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $28)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($4, $27)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $26)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($8, $0), =($14, $1))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(sr_item_sk=[$1], sr_ticket_number=[$8]) HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) - HiveJoin(condition=[=($15, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) - HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) - HiveJoin(condition=[=($6, $20)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $23)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $20)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(c_customer_sk=[$0], c_current_cdemo_sk=[$2], c_current_hdemo_sk=[$3], c_current_addr_sk=[$4], c_first_shipto_date_sk=[$5], c_first_sales_date_sk=[$6]) HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($6), IS NOT NULL($3), IS NOT NULL($2), IS NOT NULL($4))]) @@ -37,52 +35,52 @@ HiveProject(product_name=[$0], store_name=[$1], store_zip=[$2], b_street_number= HiveProject(d_date_sk=[$0]) HiveFilter(condition=[=($6, 2001)]) HiveTableScan(table=[[default, date_dim]], table:alias=[d1]) - HiveProject(cs_item_sk=[$0]) - HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) - HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) - HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) - HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) - HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) - HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($25))]) - HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) + HiveFilter(condition=[AND(IS NOT NULL($25), IS NOT NULL($5))]) + HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(cs_item_sk=[$0]) + HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) + HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) + HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) + HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) + HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) + HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) + HiveProject(hd_demo_sk=[$0]) + HiveFilter(condition=[IS NOT NULL($1)]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) HiveProject(hd_demo_sk=[$0]) HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) - HiveProject(hd_demo_sk=[$0]) - HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveProject(d_date_sk=[$0], d_year=[$6]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) - HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) - HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) + HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) HiveTableScan(table=[[default, customer_address]], table:alias=[ad2]) HiveProject($f0=[$0], $f1=[$1], $f2=[$2], $f3=[$3], $f4=[$4], $f5=[$5], $f6=[$6], $f7=[$7], $f8=[$8], $f9=[$9], $f10=[$10], $f11=[$11], $f15=[$14], $f16=[$15], $f17=[$16], $f18=[$17]) HiveFilter(condition=[IS NOT NULL($14)]) - HiveProject(i_product_name=[$5], i_item_sk=[$4], s_store_name=[$6], s_zip=[$7], ca_street_number=[$0], ca_street_name=[$1], ca_city=[$2], ca_zip=[$3], ca_street_number0=[$10], ca_street_name0=[$11], ca_city0=[$12], ca_zip0=[$13], d_year=[$8], d_year0=[$9], $f14=[$14], $f15=[$15], $f16=[$16], $f17=[$17]) - HiveAggregate(group=[{3, 4, 5, 6, 24, 25, 29, 30, 34, 36, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($20)], agg#2=[sum($21)], agg#3=[sum($22)]) - HiveJoin(condition=[=($10, $41)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($8, $39), <>($38, $40))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($15, $37)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($11, $35)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($12, $33)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($9, $32)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($16, $31)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($18, $28)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[AND(=($13, $0), =($19, $1))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_product_name=[$1], i_item_sk=[$0], s_store_name=[$2], s_zip=[$3], ca_street_number=[$6], ca_street_name=[$7], ca_city=[$8], ca_zip=[$9], ca_street_number0=[$10], ca_street_name0=[$11], ca_city0=[$12], ca_zip0=[$13], d_year=[$4], d_year0=[$5], $f14=[$14], $f15=[$15], $f16=[$16], $f17=[$17]) + HiveAggregate(group=[{19, 20, 23, 24, 29, 31, 37, 38, 39, 40, 42, 43, 44, 45}], agg#0=[count()], agg#1=[sum($15)], agg#2=[sum($16)], agg#3=[sum($17)]) + HiveJoin(condition=[=($5, $41)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($12, $36)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($3, $34), <>($33, $35))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($10, $32)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $30)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $28)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($4, $27)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $26)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[AND(=($8, $0), =($14, $1))], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(sr_item_sk=[$1], sr_ticket_number=[$8]) HiveTableScan(table=[[default, store_returns]], table:alias=[store_returns]) - HiveJoin(condition=[=($15, $0)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) - HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) - HiveJoin(condition=[=($6, $20)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $23)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($11, $20)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($7, $0)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(c_customer_sk=[$0], c_current_cdemo_sk=[$2], c_current_hdemo_sk=[$3], c_current_addr_sk=[$4], c_first_shipto_date_sk=[$5], c_first_sales_date_sk=[$6]) HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($6), IS NOT NULL($3), IS NOT NULL($2), IS NOT NULL($4))]) @@ -98,31 +96,33 @@ HiveProject(product_name=[$0], store_name=[$1], store_zip=[$2], b_street_number= HiveProject(d_date_sk=[$0]) HiveFilter(condition=[=($6, 2000)]) HiveTableScan(table=[[default, date_dim]], table:alias=[d1]) - HiveProject(cs_item_sk=[$0]) - HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) - HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) - HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) - HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) - HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) - HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) - HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) - HiveFilter(condition=[AND(IS NOT NULL($5), IS NOT NULL($25))]) - HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(s_store_sk=[$0], s_store_name=[$5], s_zip=[$25]) + HiveFilter(condition=[AND(IS NOT NULL($25), IS NOT NULL($5))]) + HiveTableScan(table=[[default, store]], table:alias=[store]) + HiveProject(cs_item_sk=[$0]) + HiveFilter(condition=[>($1, *(2:DECIMAL(10, 0), $2))]) + HiveAggregate(group=[{0}], agg#0=[sum($2)], agg#1=[sum($5)]) + HiveJoin(condition=[AND(=($0, $3), =($1, $4))], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(cs_item_sk=[$14], cs_order_number=[$16], cs_ext_list_price=[$24]) + HiveTableScan(table=[[default, catalog_sales]], table:alias=[catalog_sales]) + HiveProject(cr_item_sk=[$1], cr_order_number=[$15], $f2=[+(+($22, $23), $24)]) + HiveTableScan(table=[[default, catalog_returns]], table:alias=[catalog_returns]) + HiveProject(hd_demo_sk=[$0]) + HiveFilter(condition=[IS NOT NULL($1)]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) HiveProject(hd_demo_sk=[$0]) HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd1]) - HiveProject(hd_demo_sk=[$0]) - HiveFilter(condition=[IS NOT NULL($1)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[hd2]) + HiveProject(d_date_sk=[$0], d_year=[$6]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d2]) - HiveProject(d_date_sk=[$0], d_year=[$6]) - HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveTableScan(table=[[default, date_dim]], table:alias=[d3]) + HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd1]) - HiveProject(cd_demo_sk=[$0], cd_marital_status=[$2]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[cd2]) + HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) + HiveTableScan(table=[[default, customer_address]], table:alias=[ad1]) HiveProject(ca_address_sk=[$0], ca_street_number=[$2], ca_street_name=[$3], ca_city=[$6], ca_zip=[$9]) HiveTableScan(table=[[default, customer_address]], table:alias=[ad2]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query7.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query7.q.out index 5c5d16b51077..2cef673adc7d 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query7.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query7.q.out @@ -1,23 +1,23 @@ CBO PLAN: HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveProject(i_item_id=[$0], agg1=[/(CAST($1):DOUBLE, $2)], agg2=[CAST(/($3, $4)):DECIMAL(11, 6)], agg3=[CAST(/($5, $6)):DECIMAL(11, 6)], agg4=[CAST(/($7, $8)):DECIMAL(11, 6)]) - HiveAggregate(group=[{12}], agg#0=[sum($3)], agg#1=[count($3)], agg#2=[sum($4)], agg#3=[count($4)], agg#4=[sum($6)], agg#5=[count($6)], agg#6=[sum($5)], agg#7=[count($5)]) - HiveJoin(condition=[=($0, $11)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $10)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($1, $9)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($7, $8)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveAggregate(group=[{1}], agg#0=[sum($5)], agg#1=[count($5)], agg#2=[sum($6)], agg#3=[count($6)], agg#4=[sum($8)], agg#5=[count($8)], agg#6=[sum($7)], agg#7=[count($7)]) + HiveJoin(condition=[=($2, $0)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveProject(i_item_sk=[$0], i_item_id=[$1]) + HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveJoin(condition=[=($1, $10)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($7, $9)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $8)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(ss_item_sk=[$1], ss_cdemo_sk=[$3], ss_promo_sk=[$7], ss_quantity=[$9], ss_list_price=[$11], ss_sales_price=[$12], ss_coupon_amt=[$18], ss_sold_date_sk=[$22]) HiveFilter(condition=[AND(IS NOT NULL($3), IS NOT NULL($7), IS NOT NULL($22))]) HiveTableScan(table=[[default, store_sales]], table:alias=[store_sales]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[=($6, 1998)]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) - HiveProject(cd_demo_sk=[$0]) - HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) - HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(i_item_sk=[$0], i_item_id=[$1]) - HiveTableScan(table=[[default, item]], table:alias=[item]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[OR(=($9, _UTF-16LE'N'), =($14, _UTF-16LE'N'))]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[=($6, 1998)]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(cd_demo_sk=[$0]) + HiveFilter(condition=[AND(=($2, _UTF-16LE'W'), =($1, _UTF-16LE'F'), =($3, _UTF-16LE'Primary '))]) + HiveTableScan(table=[[default, customer_demographics]], table:alias=[customer_demographics]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query8.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query8.q.out index 0bf0810023ae..321c390bd531 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query8.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query8.q.out @@ -26,14 +26,14 @@ HiveSortLimit(sort0=[$0], dir0=[ASC], fetch=[100]) HiveAggregate(group=[{0}], agg#0=[count()]) HiveProject($f0=[substr($0, 1, 5)]) HiveFilter(condition=[>($1, 10)]) - HiveAggregate(group=[{1}], agg#0=[count()]) - HiveJoin(condition=[=($0, $2)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveProject(ca_address_sk=[$0], ca_zip=[$9]) - HiveFilter(condition=[IS NOT NULL(substr(substr($9, 1, 5), 1, 2))]) - HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) + HiveAggregate(group=[{2}], agg#0=[count()]) + HiveJoin(condition=[=($1, $0)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(c_current_addr_sk=[$4]) HiveFilter(condition=[AND(=($10, _UTF-16LE'Y'), IS NOT NULL($4))]) HiveTableScan(table=[[default, customer]], table:alias=[customer]) + HiveProject(ca_address_sk=[$0], ca_zip=[$9]) + HiveFilter(condition=[IS NOT NULL(substr(substr($9, 1, 5), 1, 2))]) + HiveTableScan(table=[[default, customer_address]], table:alias=[customer_address]) HiveProject(s_store_sk=[$0], s_store_name=[$5], EXPR$0=[substr($25, 1, 2)]) HiveFilter(condition=[IS NOT NULL(substr($25, 1, 2))]) HiveTableScan(table=[[default, store]], table:alias=[store]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query80.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query80.q.out index b8fae4529e69..501a67af3946 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query80.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query80.q.out @@ -8,8 +8,8 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveAggregate(group=[{0}], agg#0=[sum($1)], agg#1=[sum($2)], agg#2=[sum($3)]) HiveProject($f0=[$15], $f1=[$4], $f2=[CASE(IS NOT NULL($9), $9, 0:DECIMAL(12, 2))], $f3=[-($5, CASE(IS NOT NULL($10), $10, 0:DECIMAL(12, 2)))]) HiveJoin(condition=[=($1, $14)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($6, $13)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $13)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $12)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($0, $11)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[AND(=($0, $7), =($3, $8))], joinType=[left], algorithm=[none], cost=[not available]) HiveProject(ss_item_sk=[$1], ss_store_sk=[$6], ss_promo_sk=[$7], ss_ticket_number=[$8], ss_ext_sales_price=[$14], ss_net_profit=[$21], ss_sold_date_sk=[$22]) @@ -20,20 +20,20 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(i_item_sk=[$0]) HiveFilter(condition=[>($5, 50:DECIMAL(2, 0))]) HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[=($11, _UTF-16LE'N')]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[=($11, _UTF-16LE'N')]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) HiveProject(s_store_sk=[$0], s_store_id=[$1]) HiveTableScan(table=[[default, store]], table:alias=[store]) HiveProject(channel=[_UTF-16LE'catalog channel':VARCHAR(2147483647) CHARACTER SET "UTF-16LE"], id=[||(_UTF-16LE'catalog_page':VARCHAR(2147483647) CHARACTER SET "UTF-16LE", $0)], sales=[$1], returns=[$2], profit=[$3]) HiveAggregate(group=[{0}], agg#0=[sum($1)], agg#1=[sum($2)], agg#2=[sum($3)]) HiveProject($f0=[$15], $f1=[$4], $f2=[CASE(IS NOT NULL($9), $9, 0:DECIMAL(12, 2))], $f3=[-($5, CASE(IS NOT NULL($10), $10, 0:DECIMAL(12, 2)))]) HiveJoin(condition=[=($0, $14)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($6, $13)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $13)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $12)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($1, $11)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[AND(=($1, $7), =($3, $8))], joinType=[left], algorithm=[none], cost=[not available]) HiveProject(cs_catalog_page_sk=[$11], cs_item_sk=[$14], cs_promo_sk=[$15], cs_order_number=[$16], cs_ext_sales_price=[$22], cs_net_profit=[$32], cs_sold_date_sk=[$33]) @@ -44,20 +44,20 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(i_item_sk=[$0]) HiveFilter(condition=[>($5, 50:DECIMAL(2, 0))]) HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[=($11, _UTF-16LE'N')]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[=($11, _UTF-16LE'N')]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) HiveProject(cp_catalog_page_sk=[$0], cp_catalog_page_id=[$1]) HiveTableScan(table=[[default, catalog_page]], table:alias=[catalog_page]) HiveProject(channel=[_UTF-16LE'web channel':VARCHAR(2147483647) CHARACTER SET "UTF-16LE"], id=[||(_UTF-16LE'web_site':VARCHAR(2147483647) CHARACTER SET "UTF-16LE", $0)], sales=[$1], returns=[$2], profit=[$3]) HiveAggregate(group=[{0}], agg#0=[sum($1)], agg#1=[sum($2)], agg#2=[sum($3)]) HiveProject($f0=[$15], $f1=[$4], $f2=[CASE(IS NOT NULL($9), $9, 0:DECIMAL(12, 2))], $f3=[-($5, CASE(IS NOT NULL($10), $10, 0:DECIMAL(12, 2)))]) HiveJoin(condition=[=($1, $14)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($6, $13)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $12)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $13)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($6, $12)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($0, $11)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[AND(=($0, $7), =($3, $8))], joinType=[left], algorithm=[none], cost=[not available]) HiveProject(ws_item_sk=[$2], ws_web_site_sk=[$12], ws_promo_sk=[$15], ws_order_number=[$16], ws_ext_sales_price=[$22], ws_net_profit=[$32], ws_sold_date_sk=[$33]) @@ -68,12 +68,12 @@ HiveSortLimit(sort0=[$0], sort1=[$1], dir0=[ASC], dir1=[ASC], fetch=[100]) HiveProject(i_item_sk=[$0]) HiveFilter(condition=[>($5, 50:DECIMAL(2, 0))]) HiveTableScan(table=[[default, item]], table:alias=[item]) - HiveProject(p_promo_sk=[$0]) - HiveFilter(condition=[=($11, _UTF-16LE'N')]) - HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) - HiveProject(d_date_sk=[$0]) - HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) - HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(d_date_sk=[$0]) + HiveFilter(condition=[BETWEEN(false, CAST($2):TIMESTAMP(9), 1998-08-04 00:00:00:TIMESTAMP(9), 1998-09-03 00:00:00:TIMESTAMP(9))]) + HiveTableScan(table=[[default, date_dim]], table:alias=[date_dim]) + HiveProject(p_promo_sk=[$0]) + HiveFilter(condition=[=($11, _UTF-16LE'N')]) + HiveTableScan(table=[[default, promotion]], table:alias=[promotion]) HiveProject(web_site_sk=[$0], web_site_id=[$1]) HiveTableScan(table=[[default, web_site]], table:alias=[web_site]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query96.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query96.q.out index c5293dfc7d11..410434109319 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query96.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/cbo_query96.q.out @@ -1,7 +1,7 @@ CBO PLAN: HiveAggregate(group=[{}], agg#0=[count()]) - HiveJoin(condition=[=($1, $5)], joinType=[inner], algorithm=[none], cost=[not available]) - HiveJoin(condition=[=($2, $4)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($2, $5)], joinType=[inner], algorithm=[none], cost=[not available]) + HiveJoin(condition=[=($1, $4)], joinType=[inner], algorithm=[none], cost=[not available]) HiveJoin(condition=[=($0, $3)], joinType=[inner], algorithm=[none], cost=[not available]) HiveProject(ss_sold_time_sk=[$0], ss_hdemo_sk=[$4], ss_store_sk=[$6]) HiveFilter(condition=[AND(IS NOT NULL($6), IS NOT NULL($4), IS NOT NULL($0))]) @@ -9,10 +9,10 @@ HiveAggregate(group=[{}], agg#0=[count()]) HiveProject(t_time_sk=[$0]) HiveFilter(condition=[AND(=($3, 8), >=($4, 30))]) HiveTableScan(table=[[default, time_dim]], table:alias=[time_dim]) - HiveProject(s_store_sk=[$0]) - HiveFilter(condition=[=($5, _UTF-16LE'ese')]) - HiveTableScan(table=[[default, store]], table:alias=[store]) - HiveProject(hd_demo_sk=[$0]) - HiveFilter(condition=[=($3, 5)]) - HiveTableScan(table=[[default, household_demographics]], table:alias=[household_demographics]) + HiveProject(hd_demo_sk=[$0]) + HiveFilter(condition=[=($3, 5)]) + HiveTableScan(table=[[default, household_demographics]], table:alias=[household_demographics]) + HiveProject(s_store_sk=[$0]) + HiveFilter(condition=[=($5, _UTF-16LE'ese')]) + HiveTableScan(table=[[default, store]], table:alias=[store]) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1.q.out index 509b613345fc..37430ac90f49 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1.q.out @@ -7,14 +7,14 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 12 (BROADCAST_EDGE), Reducer 11 (BROADCAST_EDGE), Reducer 6 (BROADCAST_EDGE) - Map 8 <- Map 12 (BROADCAST_EDGE), Reducer 6 (BROADCAST_EDGE) + Map 1 <- Map 5 (BROADCAST_EDGE), Reducer 11 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) + Map 8 <- Map 5 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) Reducer 10 <- Reducer 9 (SIMPLE_EDGE) Reducer 11 <- Reducer 10 (CUSTOM_SIMPLE_EDGE) - Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 5 (BROADCAST_EDGE) - Reducer 3 <- Map 7 (CUSTOM_SIMPLE_EDGE), Reducer 10 (BROADCAST_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE) + Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 6 (BROADCAST_EDGE), Reducer 10 (BROADCAST_EDGE) + Reducer 3 <- Map 12 (CUSTOM_SIMPLE_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) - Reducer 6 <- Map 5 (CUSTOM_SIMPLE_EDGE) + Reducer 7 <- Map 6 (CUSTOM_SIMPLE_EDGE) Reducer 9 <- Map 8 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: @@ -22,10 +22,10 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_returns - filterExpr: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_47_store_returns_sr_store_sk_min) AND DynamicValue(RS_47_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_47_store_returns_sr_store_sk_bloom_filter))) (type: boolean) + filterExpr: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_44_store_returns_sr_store_sk_min) AND DynamicValue(RS_44_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_44_store_returns_sr_store_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 8332595709 Data size: 1113890910776 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_47_store_returns_sr_store_sk_min) AND DynamicValue(RS_47_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_47_store_returns_sr_store_sk_bloom_filter))) (type: boolean) + predicate: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_44_store_returns_sr_store_sk_min) AND DynamicValue(RS_44_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_44_store_returns_sr_store_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 8033148295 Data size: 1073861157208 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: sr_customer_sk (type: bigint), sr_store_sk (type: bigint), sr_fee (type: decimal(7,2)), sr_returned_date_sk (type: bigint) @@ -39,7 +39,7 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Map 12 + 1 Map 5 Statistics: Num rows: 1472589806 Data size: 169844484256 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) @@ -58,6 +58,24 @@ STAGE PLANS: Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 12 + Map Operator Tree: + TableScan + alias: customer + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: c_customer_sk (type: bigint), c_customer_id (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string) + Execution mode: vectorized, llap + LLAP IO: may be used (ACID table) + Map 5 Map Operator Tree: TableScan alias: date_dim @@ -91,7 +109,7 @@ STAGE PLANS: Target Input: store_returns Partition key expr: sr_returned_date_sk Statistics: Num rows: 367 Data size: 2936 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 8 + Target Vertex: Map 1 Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z @@ -113,35 +131,35 @@ STAGE PLANS: Target Input: store_returns Partition key expr: sr_returned_date_sk Statistics: Num rows: 367 Data size: 2936 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 1 + Target Vertex: Map 8 Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 5 + Map 6 Map Operator Tree: TableScan alias: store filterExpr: (s_state = 'NM') (type: boolean) - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_state = 'NM') (type: boolean) - Statistics: Num rows: 39 Data size: 3666 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 3760 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 39 Data size: 312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 320 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 39 Data size: 312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 320 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 39 Data size: 312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 320 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) - minReductionHashAggr: 0.974359 + minReductionHashAggr: 0.975 mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE @@ -152,24 +170,6 @@ STAGE PLANS: value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 7 - Map Operator Tree: - TableScan - alias: customer - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) - Execution mode: vectorized, llap - LLAP IO: may be used (ACID table) Map 8 Map Operator Tree: TableScan @@ -191,7 +191,7 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Map 12 + 1 Map 5 Statistics: Num rows: 1499681380 Data size: 172969152424 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) @@ -284,15 +284,27 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Map 5 - Statistics: Num rows: 33743267 Data size: 3779245920 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 33743267 Data size: 3779245920 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: bigint), _col2 (type: decimal(17,2)) + 1 Map 6 + Statistics: Num rows: 34608481 Data size: 3876149888 Basic stats: COMPLETE Column stats: COMPLETE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: bigint) + 1 _col1 (type: bigint) + outputColumnNames: _col0, _col2, _col4 + input vertices: + 1 Reducer 10 + Statistics: Num rows: 34824784 Data size: 7802482048 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (_col2 > _col4) (type: boolean) + Statistics: Num rows: 11608261 Data size: 2600827280 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 11608261 Data size: 2600827280 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: @@ -302,46 +314,33 @@ STAGE PLANS: keys: 0 KEY.reducesinkkey0 (type: bigint) 1 KEY.reducesinkkey0 (type: bigint) - outputColumnNames: _col1, _col2, _col5 + outputColumnNames: _col7 input vertices: - 1 Map 7 - Statistics: Num rows: 33743267 Data size: 7153572612 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 12 + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col1 (type: bigint) - 1 _col1 (type: bigint) - outputColumnNames: _col2, _col5, _col6 - input vertices: - 1 Reducer 10 - Statistics: Num rows: 33954162 Data size: 11001148488 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (_col2 > _col6) (type: boolean) - Statistics: Num rows: 11318054 Data size: 3667049496 Basic stats: COMPLETE Column stats: COMPLETE - Top N Key Operator - sort order: + - keys: _col5 (type: char(16)) + Top N Key Operator + sort order: + + keys: _col7 (type: string) + null sort order: z + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE + top n: 100 + Select Operator + expressions: _col7 (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: string) null sort order: z - Statistics: Num rows: 11318054 Data size: 3667049496 Basic stats: COMPLETE Column stats: COMPLETE - top n: 100 - Select Operator - expressions: _col5 (type: char(16)) - outputColumnNames: _col0 - Statistics: Num rows: 11318054 Data size: 1131805400 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: char(16)) - null sort order: z - sort order: + - Statistics: Num rows: 11318054 Data size: 1131805400 Basic stats: COMPLETE Column stats: COMPLETE + sort order: + + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)) + expressions: KEY.reducesinkkey0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 11318054 Data size: 1131805400 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 10000 Basic stats: COMPLETE Column stats: COMPLETE @@ -352,7 +351,7 @@ STAGE PLANS: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - Reducer 6 + Reducer 7 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query10.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query10.q.out index 26da6dc22675..25d3485a06a6 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query10.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query10.q.out @@ -116,7 +116,7 @@ STAGE PLANS: TableScan alias: c filterExpr: (c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_163_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.00250005 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_163_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0025026375 Statistics: Num rows: 80000000 Data size: 1897611080 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) @@ -134,18 +134,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 7 - Statistics: Num rows: 200004 Data size: 1600040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 200211 Data size: 1601696 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 200004 Data size: 1600040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 200211 Data size: 1601696 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 200004 Data size: 1600032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 200211 Data size: 1601688 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -164,20 +164,20 @@ STAGE PLANS: TableScan alias: ca filterExpr: (ca_county) IN ('Dona Ana County', 'Douglas County', 'Gaines County', 'Richland County', 'Walker County') (type: boolean) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 4122577968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_county) IN ('Dona Ana County', 'Douglas County', 'Gaines County', 'Richland County', 'Walker County') (type: boolean) - Statistics: Num rows: 103627 Data size: 10984462 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 103734 Data size: 10691416 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 103627 Data size: 829016 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 103734 Data size: 829872 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 103627 Data size: 829016 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 103734 Data size: 829872 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 8 @@ -348,7 +348,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 8 - Statistics: Num rows: 1481515 Data size: 22104216 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1483045 Data size: 22127040 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: @@ -359,7 +359,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col5 input vertices: 1 Reducer 11 - Statistics: Num rows: 5246461 Data size: 103329196 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5246461 Data size: 103327540 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Left Outer Join 0 to 1 @@ -369,14 +369,14 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col7 input vertices: 1 Reducer 13 - Statistics: Num rows: 5209374 Data size: 81749960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5209374 Data size: 81748304 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col5 is not null or _col7 is not null) (type: boolean) - Statistics: Num rows: 5209374 Data size: 81749960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5209374 Data size: 81748304 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: bigint) outputColumnNames: _col1 - Statistics: Num rows: 5209374 Data size: 40074968 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5209374 Data size: 40073312 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query11.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query11.q.out index d569bd484af9..1dc828759f42 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query11.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query11.q.out @@ -30,20 +30,20 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer - Statistics: Num rows: 80000000 Data size: 16000000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15742561276 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)), c_birth_country (type: varchar(20)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string), c_birth_country (type: varchar(20)) outputColumnNames: _col0, _col1, _col4 - Statistics: Num rows: 80000000 Data size: 16000000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15742561276 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 16000000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)), _col4 (type: varchar(20)) + Statistics: Num rows: 80000000 Data size: 15742561276 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string), _col4 (type: varchar(20)) Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator @@ -52,21 +52,21 @@ STAGE PLANS: sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 10 @@ -253,36 +253,36 @@ STAGE PLANS: TableScan alias: customer probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_302_container, bigKeyColName:c_customer_id, smallTablePos:0, keyRatio:0.1111111125 - Statistics: Num rows: 80000000 Data size: 29760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 28998830376 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_id (type: char(16)), c_first_name (type: char(20)), c_last_name (type: char(30)), c_birth_country (type: varchar(20)) + expressions: c_customer_id (type: string), c_first_name (type: char(20)), c_last_name (type: char(30)), c_birth_country (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 29760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 28998830376 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: char(16)) - 1 _col0 (type: char(16)) + 0 _col0 (type: string) + 1 _col0 (type: string) outputColumnNames: _col0, _col2, _col3, _col4 input vertices: 0 Reducer 9 - Statistics: Num rows: 13333333 Data size: 4959999876 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13333333 Data size: 4198830252 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++++ - keys: _col0 (type: char(16)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) + keys: _col0 (type: string), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) null sort order: zzzz - Statistics: Num rows: 13333333 Data size: 4959999876 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13333333 Data size: 4198830252 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator - expressions: _col0 (type: char(16)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) + expressions: _col0 (type: string), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 13333333 Data size: 4959999876 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13333333 Data size: 3437660356 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: varchar(20)) + key expressions: _col0 (type: string), _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: varchar(20)) null sort order: zzzz sort order: ++++ - Statistics: Num rows: 13333333 Data size: 4959999876 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13333333 Data size: 3437660356 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 2 @@ -377,16 +377,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.9815675 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(18,2)) Reducer 15 @@ -394,15 +394,15 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(18,2)) Reducer 16 @@ -421,16 +421,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.9815675 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(18,2)) Reducer 17 @@ -438,7 +438,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -446,29 +446,29 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 26666666 Data size: 5653333192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(18,2)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(18,2)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(18,2)), _col2 (type: boolean) Reducer 19 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: char(30)), KEY.reducesinkkey3 (type: varchar(20)) + expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: char(30)), KEY.reducesinkkey3 (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 13333333 Data size: 4959999876 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13333333 Data size: 3437660356 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 37200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 26048 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 37200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 26048 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -489,16 +489,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(18,2)) Reducer 4 @@ -506,7 +506,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -514,14 +514,14 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 26666666 Data size: 5653333192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(18,2)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(18,2)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(18,2)), _col2 (type: boolean) Reducer 5 @@ -536,40 +536,40 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col8 input vertices: 1 Map 1 - Statistics: Num rows: 16584098707 Data size: 5041566006928 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16584098707 Data size: 5041308568204 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)), _col8 (type: varchar(20)) - minReductionHashAggr: 0.9291035 + keys: _col5 (type: string), _col8 (type: varchar(20)) + minReductionHashAggr: 0.92926776 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 24320000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 24318758276 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: varchar(20)) + key expressions: _col0 (type: string), _col1 (type: varchar(20)) null sort order: zz sort order: ++ - Map-reduce partition columns: _col0 (type: char(16)), _col1 (type: varchar(20)) - Statistics: Num rows: 80000000 Data size: 24320000000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: string), _col1 (type: varchar(20)) + Statistics: Num rows: 80000000 Data size: 24318758276 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(18,2)) Reducer 6 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)), KEY._col1 (type: varchar(20)) + keys: KEY._col0 (type: string), KEY._col1 (type: varchar(20)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 24320000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 24318758276 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col2 (type: decimal(18,2)) + expressions: _col0 (type: string), _col2 (type: decimal(18,2)) outputColumnNames: _col0, _col2 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(18,2)) Reducer 7 @@ -579,18 +579,18 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col2, _col4, _col5 input vertices: 1 Reducer 4 Statistics: Num rows: 26666666 Data size: 8746666448 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 8746666448 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(18,2)), _col4 (type: decimal(18,2)), _col5 (type: boolean) Reducer 8 @@ -600,18 +600,18 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col2, _col4, _col5, _col7 input vertices: 1 Reducer 15 Statistics: Num rows: 26666666 Data size: 11733333040 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 11733333040 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(18,2)), _col4 (type: decimal(18,2)), _col5 (type: boolean), _col7 (type: decimal(18,2)) Reducer 9 @@ -621,8 +621,8 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col2, _col4, _col5, _col7, _col9, _col10 input vertices: 1 Reducer 17 @@ -632,14 +632,14 @@ STAGE PLANS: predicate: if(_col5, if(_col10, ((_col7 / _col9) > (_col2 / _col4)), (0 > (_col2 / _col4))), if(_col10, ((_col7 / _col9) > 0), false)) (type: boolean) Statistics: Num rows: 13333333 Data size: 7413333148 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)) + expressions: _col0 (type: string) outputColumnNames: _col0 Statistics: Num rows: 13333333 Data size: 1333333300 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 13333333 Data size: 1333333300 Basic stats: COMPLETE Column stats: COMPLETE Stage: Stage-0 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query12.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query12.q.out index 8d5eeb1dcade..7b47669a792c 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query12.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query12.q.out @@ -17,7 +17,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: web_sales - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_56_container, bigKeyColName:ws_item_sk, smallTablePos:1, keyRatio:0.2727272808816537 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_56_container, bigKeyColName:ws_item_sk, smallTablePos:1, keyRatio:0.3000000119566716 Statistics: Num rows: 21594638446 Data size: 2763811113552 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ws_item_sk (type: bigint), ws_ext_sales_price (type: decimal(7,2)), ws_sold_date_sk (type: bigint) @@ -32,7 +32,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col4, _col5, _col6, _col7, _col8 input vertices: 1 Map 5 - Statistics: Num rows: 5889447025 Data size: 4110531380410 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6478391792 Data size: 4521614698726 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -42,20 +42,20 @@ STAGE PLANS: outputColumnNames: _col1, _col4, _col5, _col6, _col7, _col8 input vertices: 1 Map 6 - Statistics: Num rows: 654338207 Data size: 451190719790 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 719772035 Data size: 496339932060 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col8 (type: char(50)), _col7 (type: char(50)), _col4 (type: string), _col5 (type: varchar(200)), _col6 (type: decimal(7,2)) - minReductionHashAggr: 0.98058045 + minReductionHashAggr: 0.9796346 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -64,20 +64,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_category) IN ('Books ', 'Jewelry ', 'Sports ') (type: boolean) - Statistics: Num rows: 462000 Data size: 270601408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 270182180 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_category) IN ('Books ', 'Jewelry ', 'Sports ') (type: boolean) - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)), i_current_price (type: decimal(7,2)), i_class (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)), _col3 (type: decimal(7,2)), _col4 (type: char(50)), _col5 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -126,13 +126,13 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: string), KEY._col3 (type: varchar(200)), KEY._col4 (type: decimal(7,2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: char(50)) null sort order: a sort order: + Map-reduce partition columns: _col1 (type: char(50)) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -140,7 +140,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: string), VALUE._col2 (type: varchar(200)), VALUE._col3 (type: decimal(7,2)), VALUE._col4 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -160,22 +160,22 @@ STAGE PLANS: name: sum window function: GenericUDAFSumHiveDecimal window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++ keys: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), ((_col5 * 100) / sum_window_0) (type: decimal(38,17)) null sort order: zzzzz - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: varchar(200)), _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)), ((_col5 * 100) / sum_window_0) (type: decimal(38,17)), _col2 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 126000 Data size: 101052000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 111157200 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: char(50)), _col2 (type: char(50)), _col6 (type: string), _col0 (type: varchar(200)), _col5 (type: decimal(38,17)) null sort order: zzzzz sort order: +++++ - Statistics: Num rows: 126000 Data size: 101052000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 111157200 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(7,2)), _col4 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -183,7 +183,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey3 (type: varchar(200)), KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey1 (type: char(50)), VALUE._col0 (type: decimal(7,2)), VALUE._col1 (type: decimal(17,2)), KEY.reducesinkkey4 (type: decimal(38,17)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 88452000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 97297200 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 70200 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query13.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query13.q.out index 0219ac32e5eb..4799304a997f 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query13.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query13.q.out @@ -16,7 +16,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: (ss_net_profit is not null and ss_sales_price is not null and ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_store_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_89_container, bigKeyColName:ss_hdemo_sk, smallTablePos:1, keyRatio:7.945618813963477E-8 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_89_container, bigKeyColName:ss_hdemo_sk, smallTablePos:1, keyRatio:1.6196651895943854E-7 Statistics: Num rows: 82510879939 Data size: 39653754183252 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ss_net_profit is not null and ss_sales_price is not null and ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_store_sk is not null) (type: boolean) @@ -44,10 +44,10 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col7, _col8, _col9, _col10, _col11, _col12, _col15, _col16, _col17 input vertices: 1 Map 4 - Statistics: Num rows: 1220237740 Data size: 43928558884 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2487407293 Data size: 284875875036 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col15 and _col7) or (_col16 and _col8) or (_col17 and _col9)) (type: boolean) - Statistics: Num rows: 915178305 Data size: 32946419224 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1865555469 Data size: 213656906308 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -57,7 +57,7 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5, _col10, _col11, _col12, _col19, _col20 input vertices: 1 Map 5 - Statistics: Num rows: 183035664 Data size: 3660713516 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 373111100 Data size: 7462222236 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -67,14 +67,14 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col10, _col11, _col12, _col19, _col20, _col22, _col23, _col24, _col25, _col26, _col27 input vertices: 1 Map 6 - Statistics: Num rows: 47066317 Data size: 2070918176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 95942860 Data size: 4221486068 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col22 and _col23 and _col10 and _col19) or (_col24 and _col25 and _col11 and _col20) or (_col26 and _col27 and _col12 and _col20)) (type: boolean) - Statistics: Num rows: 8824932 Data size: 388297236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 17989284 Data size: 791528724 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: int), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) outputColumnNames: _col3, _col4, _col5 - Statistics: Num rows: 8824932 Data size: 388297236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 17989284 Data size: 791528724 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col3), count(_col3), sum(_col4), count(_col4), sum(_col5), count(_col5) minReductionHashAggr: 0.99 @@ -130,20 +130,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: ((ca_state) IN ('GA', 'IN', 'KY', 'MO', 'MT', 'NM', 'OR', 'WI', 'WV') and (ca_country = 'United States')) (type: boolean) - Statistics: Num rows: 40000000 Data size: 7640000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7420490932 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((ca_state) IN ('GA', 'IN', 'KY', 'MO', 'MT', 'NM', 'OR', 'WI', 'WV') and (ca_country = 'United States')) (type: boolean) - Statistics: Num rows: 3396227 Data size: 648679357 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 1284315894 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), (ca_state) IN ('GA', 'KY', 'NM') (type: boolean), (ca_state) IN ('IN', 'MT', 'OR') (type: boolean), (ca_state) IN ('MO', 'WI', 'WV') (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3396227 Data size: 67924540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 138461540 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 3396227 Data size: 67924540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 138461540 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: boolean), _col2 (type: boolean), _col3 (type: boolean) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query15.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query15.q.out index 771fbbaf8173..3785ce263ade 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query15.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query15.q.out @@ -40,17 +40,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer_address - Statistics: Num rows: 40000000 Data size: 7320000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7109993931 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_zip (type: char(10)), (ca_state) IN ('CA', 'GA', 'WA') (type: boolean), (substr(ca_zip, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792') (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 40000000 Data size: 4200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 4093173033 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 4093173033 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(10)), _col2 (type: boolean), _col3 (type: boolean) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -135,14 +135,14 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5 input vertices: 1 Map 3 - Statistics: Num rows: 80000000 Data size: 8400000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 8293173033 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 8400000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 8293173033 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: char(10)), _col4 (type: boolean), _col5 (type: boolean) Reducer 5 Execution mode: vectorized, llap @@ -156,34 +156,34 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col7, _col9 input vertices: 0 Reducer 2 - Statistics: Num rows: 2146106610 Data size: 445233418138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2146106610 Data size: 445126591171 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Filter Operator predicate: (_col4 or _col9 or _col5) (type: boolean) - Statistics: Num rows: 2146106610 Data size: 445233418138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2146106610 Data size: 445126591171 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col3 (type: char(10)) null sort order: z - Statistics: Num rows: 2146106610 Data size: 445233418138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2146106610 Data size: 445126591171 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: char(10)), _col7 (type: decimal(7,2)) outputColumnNames: _col3, _col7 - Statistics: Num rows: 2146106610 Data size: 445233418138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2146106610 Data size: 445126591171 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col7) keys: _col3 (type: char(10)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 16596120 Data size: 3335820120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16588321 Data size: 3332601215 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(10)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(10)) - Statistics: Num rows: 16596120 Data size: 3335820120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16588321 Data size: 3332601215 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -193,12 +193,12 @@ STAGE PLANS: keys: KEY._col0 (type: char(10)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 9538 Data size: 1917138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9539 Data size: 1916449 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(10)) null sort order: z sort order: + - Statistics: Num rows: 9538 Data size: 1917138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9539 Data size: 1916449 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -206,7 +206,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(10)), VALUE._col0 (type: decimal(17,2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 9538 Data size: 1917138 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9539 Data size: 1916449 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 20100 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query16.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query16.q.out index 9cd4986a6e30..c7a4ecc725ab 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query16.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query16.q.out @@ -41,7 +41,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6 input vertices: 1 Map 8 - Statistics: Num rows: 803365808 Data size: 176672786488 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 818815406 Data size: 180627883576 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -51,7 +51,7 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5, _col6 input vertices: 1 Map 9 - Statistics: Num rows: 160673164 Data size: 19280779808 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 163763084 Data size: 19651570208 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -61,20 +61,20 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col6 input vertices: 1 Map 10 - Statistics: Num rows: 17851352 Data size: 2142162360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 2183358480 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col4 (type: bigint) - Statistics: Num rows: 17851352 Data size: 2142162360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 2183358480 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) Select Operator expressions: _col4 (type: bigint) outputColumnNames: _col4 - Statistics: Num rows: 17851352 Data size: 142810816 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 145557224 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col4), max(_col4), bloom_filter(_col4, expectedEntries=1869746) + aggregations: min(_col4), max(_col4), bloom_filter(_col4, expectedEntries=1905703) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 @@ -167,20 +167,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_state = 'NY') (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_state = 'NY') (type: boolean) - Statistics: Num rows: 754717 Data size: 70943398 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 70323608 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 9 @@ -217,25 +217,25 @@ STAGE PLANS: input vertices: 1 Map 11 residual filter predicates: {(_col3 <> _col14)} - Statistics: Num rows: 17851352 Data size: 2142162368 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 2183358488 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col4 (type: bigint), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) outputColumnNames: _col4, _col5, _col6 - Statistics: Num rows: 17851352 Data size: 2142162352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 2183358472 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col4 (type: bigint) - Statistics: Num rows: 17851352 Data size: 2142162352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 2183358472 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) Select Operator expressions: _col4 (type: bigint) outputColumnNames: _col4 - Statistics: Num rows: 17851352 Data size: 142810816 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 145557224 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col4), max(_col4), bloom_filter(_col4, expectedEntries=1869746) + aggregations: min(_col4), max(_col4), bloom_filter(_col4, expectedEntries=1905703) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 @@ -257,7 +257,7 @@ STAGE PLANS: outputColumnNames: _col4, _col5, _col6 input vertices: 1 Map 12 - Statistics: Num rows: 17851352 Data size: 2142162352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18194653 Data size: 2183358472 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col5), sum(_col6) @@ -265,13 +265,13 @@ STAGE PLANS: minReductionHashAggr: 0.8952603 mode: hash outputColumnNames: _col0, _col2, _col3 - Statistics: Num rows: 8925676 Data size: 2070756832 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9097326 Data size: 2110579632 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 8925676 Data size: 2070756832 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9097326 Data size: 2110579632 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -281,7 +281,7 @@ STAGE PLANS: keys: KEY._col0 (type: bigint) mode: partial2 outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 8925676 Data size: 2070756832 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9097326 Data size: 2110579632 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col0), sum(_col1), sum(_col2) mode: partial2 @@ -311,7 +311,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1869746) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1905703) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE @@ -324,7 +324,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1869746) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1905703) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query17.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query17.q.out index d37b1ee2e8df..f0aa109c25cd 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query17.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query17.q.out @@ -54,17 +54,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -72,17 +72,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -325,7 +325,7 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col9, _col15, _col19 input vertices: 1 Map 11 - Statistics: Num rows: 3459560664786 Data size: 366704984826736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 366704984825790 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -335,30 +335,30 @@ STAGE PLANS: outputColumnNames: _col2, _col9, _col15, _col19, _col21, _col22 input vertices: 1 Map 12 - Statistics: Num rows: 3459560664786 Data size: 1321543728307672 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1321543728093838 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++ keys: _col21 (type: string), _col22 (type: varchar(200)), _col19 (type: char(2)) null sort order: zzz - Statistics: Num rows: 3459560664786 Data size: 1321543728307672 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1321543728093838 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col21 (type: string), _col22 (type: varchar(200)), _col19 (type: char(2)), _col9 (type: int), _col15 (type: int), _col2 (type: int), UDFToDouble(_col9) (type: double), (UDFToDouble(_col9) * UDFToDouble(_col9)) (type: double), UDFToDouble(_col15) (type: double), (UDFToDouble(_col15) * UDFToDouble(_col15)) (type: double), UDFToDouble(_col2) (type: double), (UDFToDouble(_col2) * UDFToDouble(_col2)) (type: double) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 - Statistics: Num rows: 3459560664786 Data size: 1321543728307672 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1321543728093838 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col3), sum(_col3), sum(_col7), sum(_col6), count(_col6), count(_col4), sum(_col4), sum(_col9), sum(_col8), count(_col8), count(_col5), sum(_col5), sum(_col11), sum(_col10), count(_col10) keys: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: char(2)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17 - Statistics: Num rows: 3459560664786 Data size: 1695184725745140 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1695184725317202 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: char(2)) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: char(2)) - Statistics: Num rows: 3459560664786 Data size: 1695184725745140 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1695184725317202 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint), _col5 (type: double), _col6 (type: double), _col7 (type: bigint), _col8 (type: bigint), _col9 (type: bigint), _col10 (type: double), _col11 (type: double), _col12 (type: bigint), _col13 (type: bigint), _col14 (type: bigint), _col15 (type: double), _col16 (type: double), _col17 (type: bigint) Reducer 6 Execution mode: vectorized, llap @@ -368,16 +368,16 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: varchar(200)), KEY._col2 (type: char(2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17 - Statistics: Num rows: 3459560664786 Data size: 1695184725745140 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1695184725317202 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: char(2)), _col3 (type: bigint), (UDFToDouble(_col4) / _col3) (type: double), power(((_col5 - ((_col6 * _col6) / _col7)) / if((_col7 = 1L), null, (_col7 - 1))), 0.5) (type: double), (power(((_col5 - ((_col6 * _col6) / _col7)) / if((_col7 = 1L), null, (_col7 - 1))), 0.5) / (UDFToDouble(_col4) / _col3)) (type: double), _col8 (type: bigint), (UDFToDouble(_col9) / _col8) (type: double), power(((_col10 - ((_col11 * _col11) / _col12)) / if((_col12 = 1L), null, (_col12 - 1))), 0.5) (type: double), (power(((_col10 - ((_col11 * _col11) / _col12)) / if((_col12 = 1L), null, (_col12 - 1))), 0.5) / (UDFToDouble(_col9) / _col8)) (type: double), _col13 (type: bigint), (UDFToDouble(_col14) / _col13) (type: double), (power(((_col15 - ((_col16 * _col16) / _col17)) / if((_col17 = 1L), null, (_col17 - 1))), 0.5) / (UDFToDouble(_col14) / _col13)) (type: double) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13 - Statistics: Num rows: 3459560664786 Data size: 1584478784471988 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1584478784044050 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: char(2)) null sort order: zzz sort order: +++ - Statistics: Num rows: 3459560664786 Data size: 1584478784471988 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1584478784044050 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: double), _col5 (type: double), _col6 (type: double), _col7 (type: bigint), _col8 (type: double), _col9 (type: double), _col10 (type: double), _col11 (type: bigint), _col12 (type: double), _col13 (type: double) Reducer 7 Execution mode: vectorized, llap @@ -385,7 +385,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: varchar(200)), KEY.reducesinkkey2 (type: char(2)), VALUE._col0 (type: bigint), VALUE._col1 (type: double), VALUE._col2 (type: double), VALUE._col3 (type: double), VALUE._col4 (type: bigint), VALUE._col5 (type: double), VALUE._col6 (type: double), VALUE._col7 (type: double), VALUE._col8 (type: bigint), VALUE._col9 (type: double), VALUE._col10 (type: double), VALUE._col10 (type: double) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 3459560664786 Data size: 1612155269790276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3459560664786 Data size: 1612155269362338 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 46600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query18.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query18.q.out index 081b2ed7c5df..79af2055a9a8 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query18.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query18.q.out @@ -57,7 +57,7 @@ STAGE PLANS: outputColumnNames: _col2, _col4, _col5, _col6, _col7, _col8, _col11, _col13, _col15, _col17, _col18, _col19 input vertices: 1 Map 7 - Statistics: Num rows: 80563578 Data size: 50834699922 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 82112872 Data size: 51770047200 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -67,7 +67,7 @@ STAGE PLANS: outputColumnNames: _col4, _col5, _col6, _col7, _col8, _col11, _col13, _col15, _col17, _col18, _col19, _col21 input vertices: 1 Map 9 - Statistics: Num rows: 80563578 Data size: 58246549098 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 82112872 Data size: 59324431424 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -77,21 +77,21 @@ STAGE PLANS: outputColumnNames: _col4, _col5, _col6, _col7, _col8, _col11, _col15, _col17, _col18, _col19, _col21 input vertices: 1 Map 5 - Statistics: Num rows: 80563578 Data size: 57612843314 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 82112872 Data size: 58678331288 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col4), count(_col4), sum(_col5), count(_col5), sum(_col6), count(_col6), sum(_col7), count(_col7), sum(_col8), count(_col8), sum(_col15), count(_col15), sum(_col11), count(_col11) keys: _col17 (type: varchar(30)), _col18 (type: char(2)), _col19 (type: varchar(20)), _col21 (type: string), 0L (type: bigint) grouping sets: 0, 8, 12, 14, 15 - minReductionHashAggr: 0.7567873 + minReductionHashAggr: 0.7614403 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18 - Statistics: Num rows: 402817890 Data size: 495063186810 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 504356818196 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)), _col1 (type: char(2)), _col2 (type: varchar(20)), _col3 (type: string), _col4 (type: bigint) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: varchar(30)), _col1 (type: char(2)), _col2 (type: varchar(20)), _col3 (type: string), _col4 (type: bigint) - Statistics: Num rows: 402817890 Data size: 495063186810 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 504356818196 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(22,2)), _col6 (type: bigint), _col7 (type: decimal(22,2)), _col8 (type: bigint), _col9 (type: decimal(22,2)), _col10 (type: bigint), _col11 (type: decimal(22,2)), _col12 (type: bigint), _col13 (type: decimal(22,2)), _col14 (type: bigint), _col15 (type: decimal(22,2)), _col16 (type: bigint), _col17 (type: decimal(22,2)), _col18 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -168,7 +168,7 @@ STAGE PLANS: TableScan alias: customer filterExpr: ((c_birth_month) IN (1, 4, 5, 9, 10, 12) and c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_135_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0637275625 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_135_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0649530875 Statistics: Num rows: 80000000 Data size: 2515215652 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((c_birth_month) IN (1, 4, 5, 9, 10, 12) and c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) @@ -186,13 +186,13 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col5, _col6, _col7 input vertices: 1 Map 8 - Statistics: Num rows: 5098205 Data size: 1923120445 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5196247 Data size: 1917863799 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 5098205 Data size: 1923120445 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5196247 Data size: 1917863799 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint), _col3 (type: decimal(12,2)), _col5 (type: varchar(30)), _col6 (type: char(2)), _col7 (type: varchar(20)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -201,20 +201,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_state) IN ('AL', 'MS', 'NC', 'ND', 'OK', 'TN', 'WI') (type: boolean) - Statistics: Num rows: 40000000 Data size: 11560000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 11223068900 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_state) IN ('AL', 'MS', 'NC', 'ND', 'OK', 'TN', 'WI') (type: boolean) - Statistics: Num rows: 5283019 Data size: 1526792491 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5384615 Data size: 1510797911 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_county (type: varchar(30)), ca_state (type: char(2)), ca_country (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 5283019 Data size: 1526792491 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5384615 Data size: 1510797911 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 5283019 Data size: 1526792491 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5384615 Data size: 1510797911 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)), _col2 (type: char(2)), _col3 (type: varchar(20)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -244,23 +244,23 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)), KEY._col1 (type: char(2)), KEY._col2 (type: varchar(20)), KEY._col3 (type: string), KEY._col4 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18 - Statistics: Num rows: 402817890 Data size: 495063186810 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 504356818196 Basic stats: COMPLETE Column stats: COMPLETE pruneGroupingSetId: true Top N Key Operator sort order: ++++ keys: _col2 (type: varchar(20)), _col1 (type: char(2)), _col0 (type: varchar(30)), _col3 (type: string) null sort order: zzzz - Statistics: Num rows: 402817890 Data size: 495063186810 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 504356818196 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: string), _col2 (type: varchar(20)), _col1 (type: char(2)), _col0 (type: varchar(30)), CAST( (_col5 / _col6) AS decimal(16,6)) (type: decimal(16,6)), CAST( (_col7 / _col8) AS decimal(16,6)) (type: decimal(16,6)), CAST( (_col9 / _col10) AS decimal(16,6)) (type: decimal(16,6)), CAST( (_col11 / _col12) AS decimal(16,6)) (type: decimal(16,6)), CAST( (_col13 / _col14) AS decimal(16,6)) (type: decimal(16,6)), CAST( (_col15 / _col16) AS decimal(16,6)) (type: decimal(16,6)), CAST( (_col17 / _col18) AS decimal(16,6)) (type: decimal(16,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 402817890 Data size: 469282841850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 477853918631 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: varchar(20)), _col2 (type: char(2)), _col3 (type: varchar(30)), _col0 (type: string) null sort order: zzzz sort order: ++++ - Statistics: Num rows: 402817890 Data size: 469282841850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 477853918631 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(16,6)), _col5 (type: decimal(16,6)), _col6 (type: decimal(16,6)), _col7 (type: decimal(16,6)), _col8 (type: decimal(16,6)), _col9 (type: decimal(16,6)), _col10 (type: decimal(16,6)) Reducer 3 Execution mode: vectorized, llap @@ -268,7 +268,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey3 (type: string), KEY.reducesinkkey0 (type: varchar(20)), KEY.reducesinkkey1 (type: char(2)), KEY.reducesinkkey2 (type: varchar(30)), VALUE._col0 (type: decimal(16,6)), VALUE._col1 (type: decimal(16,6)), VALUE._col2 (type: decimal(16,6)), VALUE._col3 (type: decimal(16,6)), VALUE._col4 (type: decimal(16,6)), VALUE._col5 (type: decimal(16,6)), VALUE._col6 (type: decimal(16,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 402817890 Data size: 469282841850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 410564360 Data size: 477853918631 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 116500 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query19.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query19.q.out index e7c795225aec..bff9027b7c8c 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query19.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query19.q.out @@ -40,17 +40,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 165288 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 164309 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), substr(s_zip, 1, 5) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 162616 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 162616 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -58,17 +58,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer_address - Statistics: Num rows: 40000000 Data size: 3880000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3773173033 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), substr(ca_zip, 1, 5) (type: string) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 3840000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3734373336 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3840000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3734373336 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -105,13 +105,13 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Map 9 - Statistics: Num rows: 12841079 Data size: 2606739085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 2606737135 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 12841079 Data size: 2606739085 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 2606737135 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: char(50)), _col9 (type: int), _col10 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -157,20 +157,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_manager_id = 7) (type: boolean) - Statistics: Num rows: 462000 Data size: 99316352 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 99090947 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manager_id = 7) (type: boolean) - Statistics: Num rows: 4442 Data size: 954910 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 952960 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand_id (type: int), i_brand (type: char(50)), i_manufact_id (type: int), i_manufact (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 4442 Data size: 937182 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 935232 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 937182 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 935232 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)), _col3 (type: int), _col4 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -186,14 +186,14 @@ STAGE PLANS: outputColumnNames: _col0, _col3 input vertices: 1 Map 3 - Statistics: Num rows: 80000000 Data size: 7680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 7574373336 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 7680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 7574373336 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: string) Reducer 5 Execution mode: vectorized, llap @@ -207,7 +207,7 @@ STAGE PLANS: outputColumnNames: _col3, _col6, _col7, _col11, _col12, _col13, _col14 input vertices: 0 Reducer 2 - Statistics: Num rows: 12841079 Data size: 3736754029 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 3631125415 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: @@ -218,27 +218,27 @@ STAGE PLANS: outputColumnNames: _col3, _col7, _col11, _col12, _col13, _col14, _col16 input vertices: 1 Map 10 - Statistics: Num rows: 12841079 Data size: 4866768973 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4761139391 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col3 <> _col16) (type: boolean) - Statistics: Num rows: 12841079 Data size: 4866768973 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4761139391 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col7 (type: decimal(7,2)), _col11 (type: int), _col12 (type: char(50)), _col13 (type: int), _col14 (type: char(50)) outputColumnNames: _col7, _col11, _col12, _col13, _col14 - Statistics: Num rows: 12841079 Data size: 4866768973 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4761139391 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col7) keys: _col12 (type: char(50)), _col11 (type: int), _col13 (type: int), _col14 (type: char(50)) - minReductionHashAggr: 0.9687239 + minReductionHashAggr: 0.96868783 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 12841079 Data size: 4044939805 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044937855 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: int), _col2 (type: int), _col3 (type: char(50)) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: int), _col2 (type: int), _col3 (type: char(50)) - Statistics: Num rows: 12841079 Data size: 4044939805 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044937855 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -248,29 +248,29 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: char(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 12841079 Data size: 4044939805 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044937855 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: -++++ keys: _col4 (type: decimal(17,2)), _col0 (type: char(50)), _col1 (type: int), _col2 (type: int), _col3 (type: char(50)) null sort order: azzzz - Statistics: Num rows: 12841079 Data size: 4044939805 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044937855 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: int), _col3 (type: char(50)), _col4 (type: decimal(17,2)), _col0 (type: char(50)), _col1 (type: int) outputColumnNames: _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 12841079 Data size: 4044939717 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044935622 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: decimal(17,2)), _col5 (type: char(50)), _col6 (type: int), _col2 (type: int), _col3 (type: char(50)) null sort order: azzzz sort order: -++++ - Statistics: Num rows: 12841079 Data size: 4044939717 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044935622 Basic stats: COMPLETE Column stats: COMPLETE Reducer 7 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey2 (type: int), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey3 (type: int), KEY.reducesinkkey4 (type: char(50)), KEY.reducesinkkey0 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 12841079 Data size: 4044939717 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12841079 Data size: 4044935622 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 31500 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1b.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1b.q.out index 93081e70ebcd..0d53c653d4eb 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1b.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query1b.q.out @@ -7,27 +7,27 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 13 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) - Map 8 <- Reducer 5 (BROADCAST_EDGE) - Map 9 <- Map 13 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) + Map 1 <- Map 6 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 8 (BROADCAST_EDGE) + Map 13 <- Reducer 5 (BROADCAST_EDGE) + Map 9 <- Map 6 (BROADCAST_EDGE), Reducer 8 (BROADCAST_EDGE) Reducer 10 <- Map 9 (SIMPLE_EDGE) Reducer 11 <- Reducer 10 (SIMPLE_EDGE) Reducer 12 <- Reducer 11 (CUSTOM_SIMPLE_EDGE) - Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 6 (BROADCAST_EDGE) - Reducer 3 <- Map 8 (CUSTOM_SIMPLE_EDGE), Reducer 11 (BROADCAST_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE) + Reducer 2 <- Map 1 (SIMPLE_EDGE), Map 7 (BROADCAST_EDGE), Reducer 11 (BROADCAST_EDGE) + Reducer 3 <- Map 13 (CUSTOM_SIMPLE_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 2 (CUSTOM_SIMPLE_EDGE) - Reducer 7 <- Map 6 (CUSTOM_SIMPLE_EDGE) + Reducer 8 <- Map 7 (CUSTOM_SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 Map Operator Tree: TableScan alias: store_returns - filterExpr: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_47_store_returns_sr_store_sk_min) AND DynamicValue(RS_47_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_47_store_returns_sr_store_sk_bloom_filter))) (type: boolean) + filterExpr: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_44_store_returns_sr_store_sk_min) AND DynamicValue(RS_44_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_44_store_returns_sr_store_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 8332595709 Data size: 1113890910776 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_47_store_returns_sr_store_sk_min) AND DynamicValue(RS_47_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_47_store_returns_sr_store_sk_bloom_filter))) (type: boolean) + predicate: (sr_store_sk is not null and sr_customer_sk is not null and sr_store_sk BETWEEN DynamicValue(RS_41_store_s_store_sk_min) AND DynamicValue(RS_41_store_s_store_sk_max) and sr_store_sk BETWEEN DynamicValue(RS_44_store_returns_sr_store_sk_min) AND DynamicValue(RS_44_store_returns_sr_store_sk_max) and in_bloom_filter(sr_store_sk, DynamicValue(RS_41_store_s_store_sk_bloom_filter)) and in_bloom_filter(sr_store_sk, DynamicValue(RS_44_store_returns_sr_store_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 8033148295 Data size: 1073861157208 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: sr_customer_sk (type: bigint), sr_store_sk (type: bigint), sr_fee (type: decimal(7,2)), sr_returned_date_sk (type: bigint) @@ -41,7 +41,7 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Map 13 + 1 Map 6 Statistics: Num rows: 1472589806 Data size: 169844484256 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) @@ -60,6 +60,28 @@ STAGE PLANS: Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 13 + Map Operator Tree: + TableScan + alias: customer + filterExpr: (c_customer_sk BETWEEN DynamicValue(RS_47_store_returns_sr_customer_sk_min) AND DynamicValue(RS_47_store_returns_sr_customer_sk_max) and in_bloom_filter(c_customer_sk, DynamicValue(RS_47_store_returns_sr_customer_sk_bloom_filter))) (type: boolean) + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (c_customer_sk BETWEEN DynamicValue(RS_47_store_returns_sr_customer_sk_min) AND DynamicValue(RS_47_store_returns_sr_customer_sk_max) and in_bloom_filter(c_customer_sk, DynamicValue(RS_47_store_returns_sr_customer_sk_bloom_filter))) (type: boolean) + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: c_customer_sk (type: bigint), c_customer_id (type: string) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string) + Execution mode: vectorized, llap + LLAP IO: may be used (ACID table) + Map 6 Map Operator Tree: TableScan alias: date_dim @@ -93,7 +115,7 @@ STAGE PLANS: Target Input: store_returns Partition key expr: sr_returned_date_sk Statistics: Num rows: 367 Data size: 2936 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 9 + Target Vertex: Map 1 Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z @@ -115,35 +137,35 @@ STAGE PLANS: Target Input: store_returns Partition key expr: sr_returned_date_sk Statistics: Num rows: 367 Data size: 2936 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 1 + Target Vertex: Map 9 Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 6 + Map 7 Map Operator Tree: TableScan alias: store filterExpr: (s_state = 'NM') (type: boolean) - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_state = 'NM') (type: boolean) - Statistics: Num rows: 39 Data size: 3666 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 3760 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 39 Data size: 312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 320 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 39 Data size: 312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 320 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 39 Data size: 312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40 Data size: 320 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=39) - minReductionHashAggr: 0.974359 + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=40) + minReductionHashAggr: 0.975 mode: hash outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE @@ -154,28 +176,6 @@ STAGE PLANS: value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 8 - Map Operator Tree: - TableScan - alias: customer - filterExpr: (c_customer_sk BETWEEN DynamicValue(RS_43_store_returns_sr_customer_sk_min) AND DynamicValue(RS_43_store_returns_sr_customer_sk_max) and in_bloom_filter(c_customer_sk, DynamicValue(RS_43_store_returns_sr_customer_sk_bloom_filter))) (type: boolean) - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (c_customer_sk BETWEEN DynamicValue(RS_43_store_returns_sr_customer_sk_min) AND DynamicValue(RS_43_store_returns_sr_customer_sk_max) and in_bloom_filter(c_customer_sk, DynamicValue(RS_43_store_returns_sr_customer_sk_bloom_filter))) (type: boolean) - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) - Execution mode: vectorized, llap - LLAP IO: may be used (ACID table) Map 9 Map Operator Tree: TableScan @@ -197,7 +197,7 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Map 13 + 1 Map 6 Statistics: Num rows: 1499681380 Data size: 172969152424 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) @@ -317,30 +317,42 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Map 6 - Statistics: Num rows: 33743267 Data size: 3779245920 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 33743267 Data size: 3779245920 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: bigint), _col2 (type: decimal(17,2)) - Select Operator - expressions: _col0 (type: bigint) - outputColumnNames: _col0 - Statistics: Num rows: 33743267 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=329849) - minReductionHashAggr: 0.99 - mode: hash - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 7 + Statistics: Num rows: 34608481 Data size: 3876149888 Basic stats: COMPLETE Column stats: COMPLETE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col1 (type: bigint) + 1 _col1 (type: bigint) + outputColumnNames: _col0, _col2, _col4 + input vertices: + 1 Reducer 11 + Statistics: Num rows: 34824784 Data size: 7802482048 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (_col2 > _col4) (type: boolean) + Statistics: Num rows: 11608261 Data size: 2600827280 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 11608261 Data size: 2600827280 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: _col0 (type: bigint) + outputColumnNames: _col0 + Statistics: Num rows: 11608261 Data size: 576816 Basic stats: COMPLETE Column stats: COMPLETE + Group By Operator + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=338307) + minReductionHashAggr: 0.99 + mode: hash + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: @@ -350,46 +362,33 @@ STAGE PLANS: keys: 0 KEY.reducesinkkey0 (type: bigint) 1 KEY.reducesinkkey0 (type: bigint) - outputColumnNames: _col1, _col2, _col5 + outputColumnNames: _col7 input vertices: - 1 Map 8 - Statistics: Num rows: 33743267 Data size: 7153572612 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 13 + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col1 (type: bigint) - 1 _col1 (type: bigint) - outputColumnNames: _col2, _col5, _col6 - input vertices: - 1 Reducer 11 - Statistics: Num rows: 33954162 Data size: 11001148488 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (_col2 > _col6) (type: boolean) - Statistics: Num rows: 11318054 Data size: 3667049496 Basic stats: COMPLETE Column stats: COMPLETE - Top N Key Operator - sort order: + - keys: _col5 (type: char(16)) + Top N Key Operator + sort order: + + keys: _col7 (type: string) + null sort order: z + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE + top n: 100 + Select Operator + expressions: _col7 (type: string) + outputColumnNames: _col0 + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: string) null sort order: z - Statistics: Num rows: 11318054 Data size: 3667049496 Basic stats: COMPLETE Column stats: COMPLETE - top n: 100 - Select Operator - expressions: _col5 (type: char(16)) - outputColumnNames: _col0 - Statistics: Num rows: 11318054 Data size: 1131805400 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: char(16)) - null sort order: z - sort order: + - Statistics: Num rows: 11318054 Data size: 1131805400 Basic stats: COMPLETE Column stats: COMPLETE + sort order: + + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)) + expressions: KEY.reducesinkkey0 (type: string) outputColumnNames: _col0 - Statistics: Num rows: 11318054 Data size: 1131805400 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11608261 Data size: 1160826100 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 10000 Basic stats: COMPLETE Column stats: COMPLETE @@ -404,7 +403,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=329849) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=338307) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE @@ -413,11 +412,11 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reducer 7 + Reducer 8 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=39) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=40) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query20.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query20.q.out index e7dac6389994..a6a1f71091cf 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query20.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query20.q.out @@ -17,7 +17,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: catalog_sales - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_56_container, bigKeyColName:cs_item_sk, smallTablePos:1, keyRatio:0.2727272808721824 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_56_container, bigKeyColName:cs_item_sk, smallTablePos:1, keyRatio:0.3000000119404418 Statistics: Num rows: 43005109025 Data size: 5492607208208 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: cs_item_sk (type: bigint), cs_ext_sales_price (type: decimal(7,2)), cs_sold_date_sk (type: bigint) @@ -32,7 +32,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col4, _col5, _col6, _col7, _col8 input vertices: 1 Map 5 - Statistics: Num rows: 11728666448 Data size: 8174562398208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12901533221 Data size: 8993223276712 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -42,20 +42,20 @@ STAGE PLANS: outputColumnNames: _col1, _col4, _col5, _col6, _col7, _col8 input vertices: 1 Map 6 - Statistics: Num rows: 1303095951 Data size: 887089423694 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1433405560 Data size: 977002924854 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col8 (type: char(50)), _col7 (type: char(50)), _col4 (type: string), _col5 (type: varchar(200)), _col6 (type: decimal(7,2)) - minReductionHashAggr: 0.99 + minReductionHashAggr: 0.9897737 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -64,20 +64,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_category) IN ('Books ', 'Jewelry ', 'Sports ') (type: boolean) - Statistics: Num rows: 462000 Data size: 270601408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 270182180 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_category) IN ('Books ', 'Jewelry ', 'Sports ') (type: boolean) - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)), i_current_price (type: decimal(7,2)), i_class (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)), _col3 (type: decimal(7,2)), _col4 (type: char(50)), _col5 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -126,13 +126,13 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: string), KEY._col3 (type: varchar(200)), KEY._col4 (type: decimal(7,2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: char(50)) null sort order: a sort order: + Map-reduce partition columns: _col1 (type: char(50)) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -140,7 +140,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: string), VALUE._col2 (type: varchar(200)), VALUE._col3 (type: decimal(7,2)), VALUE._col4 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -160,22 +160,22 @@ STAGE PLANS: name: sum window function: GenericUDAFSumHiveDecimal window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++ keys: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), ((_col5 * 100) / sum_window_0) (type: decimal(38,17)) null sort order: zzzzz - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: varchar(200)), _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)), ((_col5 * 100) / sum_window_0) (type: decimal(38,17)), _col2 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 126000 Data size: 101052000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 111157200 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: char(50)), _col2 (type: char(50)), _col6 (type: string), _col0 (type: varchar(200)), _col5 (type: decimal(38,17)) null sort order: zzzzz sort order: +++++ - Statistics: Num rows: 126000 Data size: 101052000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 111157200 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(7,2)), _col4 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -183,7 +183,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey3 (type: varchar(200)), KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey1 (type: char(50)), VALUE._col0 (type: decimal(7,2)), VALUE._col1 (type: decimal(17,2)), KEY.reducesinkkey4 (type: decimal(38,17)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 88452000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 97297200 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 70200 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query21.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query21.q.out index b8ecf93fa13f..5f434c59bec9 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query21.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query21.q.out @@ -142,21 +142,21 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(20)), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 19251 Data size: 4158216 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18538 Data size: 4004208 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (if((_col2 > 0L), (0.666667D <= (UDFToDouble(_col3) / UDFToDouble(_col2))), false) and if((_col2 > 0L), ((UDFToDouble(_col3) / UDFToDouble(_col2)) <= 1.5D), false)) (type: boolean) - Statistics: Num rows: 4812 Data size: 1039392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4634 Data size: 1000944 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col0 (type: varchar(20)), _col1 (type: string) null sort order: zz - Statistics: Num rows: 4812 Data size: 1039392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4634 Data size: 1000944 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Reduce Output Operator key expressions: _col0 (type: varchar(20)), _col1 (type: string) null sort order: zz sort order: ++ - Statistics: Num rows: 4812 Data size: 1039392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4634 Data size: 1000944 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint), _col3 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -164,7 +164,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: varchar(20)), KEY.reducesinkkey1 (type: string), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 4812 Data size: 1039392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4634 Data size: 1000944 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 21600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query22.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query22.q.out index 592b285f4099..8e3dc573a1f3 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query22.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query22.q.out @@ -42,7 +42,7 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col6, _col7, _col8 input vertices: 1 Map 6 - Statistics: Num rows: 321094889 Data size: 125864702465 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 321094889 Data size: 125864259273 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col8 (type: char(50)) null sort order: z @@ -76,17 +76,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 183414000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 182970808 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand (type: char(50)), i_class (type: char(50)), i_category (type: char(50)), i_product_name (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 462000 Data size: 183414000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 182970808 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 183414000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 182970808 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -100,16 +100,16 @@ STAGE PLANS: aggregations: sum(_col2), count(_col2) keys: _col5 (type: char(50)), _col6 (type: char(50)), _col7 (type: char(50)), _col8 (type: char(50)), 0L (type: bigint) grouping sets: 0, 2, 6, 14, 15 - minReductionHashAggr: 0.83334786 + minReductionHashAggr: 0.833658 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1605474445 Data size: 663060945785 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 663058728269 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: bigint) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: bigint) - Statistics: Num rows: 1605474445 Data size: 663060945785 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 663058728269 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: bigint), _col6 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -119,30 +119,30 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: char(50)), KEY._col3 (type: char(50)), KEY._col4 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col5, _col6 - Statistics: Num rows: 1605474445 Data size: 663060945785 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 663058728269 Basic stats: COMPLETE Column stats: COMPLETE pruneGroupingSetId: true Top N Key Operator sort order: +++++ keys: (UDFToDouble(_col5) / _col6) (type: double), _col3 (type: char(50)), _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)) null sort order: zzzzz - Statistics: Num rows: 1605474445 Data size: 663060945785 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 663058728269 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: char(50)), _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), (UDFToDouble(_col5) / _col6) (type: double) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 1605474445 Data size: 637373354665 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 637368919244 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: double), _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)) null sort order: zzzzz sort order: +++++ - Statistics: Num rows: 1605474445 Data size: 637373354665 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 637368919244 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey2 (type: char(50)), KEY.reducesinkkey3 (type: char(50)), KEY.reducesinkkey4 (type: char(50)), KEY.reducesinkkey0 (type: double) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 1605474445 Data size: 637373354665 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1605474445 Data size: 637368919244 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 39700 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query24.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query24.q.out index 68170ac209aa..37c7f095e773 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query24.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query24.q.out @@ -64,20 +64,20 @@ STAGE PLANS: TableScan alias: store filterExpr: ((s_market_id = 7) and s_zip is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 468544 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 465739 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((s_market_id = 7) and s_zip is not null) (type: boolean) - Statistics: Num rows: 170 Data size: 46750 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 169 Data size: 46475 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), s_state (type: char(2)), s_zip (type: char(10)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 170 Data size: 46070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 169 Data size: 45799 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: char(10)) null sort order: z sort order: + Map-reduce partition columns: _col3 (type: char(10)) - Statistics: Num rows: 170 Data size: 46070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 169 Data size: 45799 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: varchar(50)), _col2 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -86,14 +86,14 @@ STAGE PLANS: TableScan alias: customer filterExpr: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 23040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 22278830376 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 23040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 22278830376 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_current_addr_sk (type: bigint), c_first_name (type: char(20)), c_last_name (type: char(30)), c_birth_country (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 80000000 Data size: 23040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 22278830376 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -103,27 +103,27 @@ STAGE PLANS: outputColumnNames: _col1, _col3, _col4, _col5, _col6, _col8, _col10, _col11, _col12 input vertices: 0 Map 9 - Statistics: Num rows: 7981221 Data size: 5147887545 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 4230628536 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col12 <> _col3) (type: boolean) - Statistics: Num rows: 7981221 Data size: 5147887545 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 4230628536 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col8 (type: bigint), _col10 (type: char(20)), _col11 (type: char(30)), _col1 (type: char(2)), _col4 (type: bigint), _col5 (type: varchar(50)), _col6 (type: char(2)) outputColumnNames: _col0, _col2, _col3, _col6, _col9, _col10, _col11 - Statistics: Num rows: 7981221 Data size: 3639436776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 3055174738 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col9 (type: bigint), _col0 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col9 (type: bigint), _col0 (type: bigint) - Statistics: Num rows: 7981221 Data size: 3639436776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 3055174738 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: char(20)), _col3 (type: char(30)), _col6 (type: char(2)), _col10 (type: varchar(50)), _col11 (type: char(2)) Select Operator expressions: _col9 (type: bigint), _col0 (type: bigint), hash(_col9,_col0) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 7981221 Data size: 159624420 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 158685460 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=7981221) + aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=7934273) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 @@ -138,14 +138,14 @@ STAGE PLANS: null sort order: zz sort order: ++ Map-reduce partition columns: _col9 (type: bigint), _col0 (type: bigint) - Statistics: Num rows: 7981221 Data size: 3639436776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 3055174738 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: char(20)), _col3 (type: char(30)), _col6 (type: char(2)), _col10 (type: varchar(50)), _col11 (type: char(2)) Select Operator expressions: _col9 (type: bigint), _col0 (type: bigint), hash(_col9,_col0) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 7981221 Data size: 159624420 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7934273 Data size: 158685460 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=7981221) + aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=7934273) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 @@ -161,25 +161,25 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 179582916 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 179273816 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_color = 'orchid ') (type: boolean) - Statistics: Num rows: 4863 Data size: 1890431 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4915 Data size: 1907655 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_current_price (type: decimal(7,2)), i_size (type: char(20)), i_units (type: char(10)), i_manager_id (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 4863 Data size: 1457624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4915 Data size: 1471288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4863 Data size: 1457624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4915 Data size: 1471288 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(7,2)), _col2 (type: char(20)), _col3 (type: char(10)), _col4 (type: int) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 4863 Data size: 38904 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4915 Data size: 39320 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -194,13 +194,13 @@ STAGE PLANS: Select Operator expressions: i_item_sk (type: bigint), i_current_price (type: decimal(7,2)), i_size (type: char(20)), i_color (type: char(20)), i_units (type: char(10)), i_manager_id (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 462000 Data size: 179582916 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 179273816 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 179582916 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 179273816 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(7,2)), _col2 (type: char(20)), _col3 (type: char(20)), _col4 (type: char(10)), _col5 (type: int) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -248,14 +248,14 @@ STAGE PLANS: alias: customer_address filterExpr: ca_zip is not null (type: boolean) probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_322_container, bigKeyColName:ca_zip, smallTablePos:1, keyRatio:2.5E-8 - Statistics: Num rows: 40000000 Data size: 11200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 10873663965 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ca_zip is not null (type: boolean) - Statistics: Num rows: 40000000 Data size: 11200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38799696 Data size: 10547371358 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_state (type: char(2)), ca_zip (type: char(10)), upper(ca_country) (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 40000000 Data size: 11200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38799696 Data size: 10547371358 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -265,13 +265,13 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6 input vertices: 1 Map 10 - Statistics: Num rows: 712937 Data size: 265925501 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 687476 Data size: 130620623 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 712937 Data size: 265925501 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 687476 Data size: 130620623 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)), _col3 (type: varchar(20)), _col4 (type: bigint), _col5 (type: varchar(50)), _col6 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -279,7 +279,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), min(VALUE._col2), max(VALUE._col3), bloom_filter(VALUE._col4, 1, expectedEntries=7981221) + aggregations: min(VALUE._col0), max(VALUE._col1), min(VALUE._col2), max(VALUE._col3), bloom_filter(VALUE._col4, 1, expectedEntries=7934273) mode: final outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: COMPLETE @@ -292,7 +292,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), min(VALUE._col2), max(VALUE._col3), bloom_filter(VALUE._col4, 1, expectedEntries=7981221) + aggregations: min(VALUE._col0), max(VALUE._col1), min(VALUE._col2), max(VALUE._col3), bloom_filter(VALUE._col4, 1, expectedEntries=7934273) mode: final outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 1 Data size: 176 Basic stats: COMPLETE Column stats: COMPLETE @@ -342,7 +342,7 @@ STAGE PLANS: outputColumnNames: _col0, _col4, _col9, _col10, _col13, _col17, _col18 input vertices: 1 Map 11 - Statistics: Num rows: 9604070077 Data size: 4981069864848 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 4948870316218 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -352,20 +352,20 @@ STAGE PLANS: outputColumnNames: _col4, _col9, _col10, _col13, _col17, _col18, _col21, _col22, _col23, _col24 input vertices: 1 Map 14 - Statistics: Num rows: 101092197 Data size: 73999487040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 101572160 Data size: 73787964270 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col4) keys: _col9 (type: char(20)), _col10 (type: char(30)), _col17 (type: varchar(50)), _col13 (type: char(2)), _col18 (type: char(2)), _col21 (type: decimal(7,2)), _col22 (type: char(20)), _col23 (type: char(10)), _col24 (type: int) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 101092197 Data size: 85321812992 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 101572160 Data size: 85164046078 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: varchar(50)), _col3 (type: char(2)), _col4 (type: char(2)), _col5 (type: decimal(7,2)), _col6 (type: char(20)), _col7 (type: char(10)), _col8 (type: int) null sort order: zzzzzzzzz sort order: +++++++++ Map-reduce partition columns: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: varchar(50)), _col3 (type: char(2)), _col4 (type: char(2)), _col5 (type: decimal(7,2)), _col6 (type: char(20)), _col7 (type: char(10)), _col8 (type: int) - Statistics: Num rows: 101092197 Data size: 85321812992 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 101572160 Data size: 85164046078 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col9 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -375,24 +375,24 @@ STAGE PLANS: keys: KEY._col0 (type: char(20)), KEY._col1 (type: char(30)), KEY._col2 (type: varchar(50)), KEY._col3 (type: char(2)), KEY._col4 (type: char(2)), KEY._col5 (type: decimal(7,2)), KEY._col6 (type: char(20)), KEY._col7 (type: char(10)), KEY._col8 (type: int) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 101092197 Data size: 85321812992 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 101572160 Data size: 85164046078 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: varchar(50)), _col9 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col3, _col9 - Statistics: Num rows: 101092197 Data size: 85321812992 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 101572160 Data size: 85164046078 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col9) keys: _col0 (type: char(20)), _col1 (type: char(30)), _col3 (type: varchar(50)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 12024 Data size: 4569120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 32634 Data size: 12239280 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: varchar(50)) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: varchar(50)) - Statistics: Num rows: 12024 Data size: 4569120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 32634 Data size: 12239280 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(27,2)) Reducer 4 Execution mode: vectorized, llap @@ -402,18 +402,18 @@ STAGE PLANS: keys: KEY._col0 (type: char(20)), KEY._col1 (type: char(30)), KEY._col2 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 36 Data size: 13680 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 49 Data size: 18620 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: varchar(50)), _col3 (type: decimal(27,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 36 Data size: 13680 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 49 Data size: 18620 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col3 is not null (type: boolean) - Statistics: Num rows: 36 Data size: 13680 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 49 Data size: 18620 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator null sort order: sort order: - Statistics: Num rows: 36 Data size: 13680 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 49 Data size: 18620 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: varchar(50)), _col3 (type: decimal(27,2)) Reducer 5 Execution mode: vectorized, llap @@ -438,7 +438,7 @@ STAGE PLANS: outputColumnNames: _col0, _col4, _col9, _col10, _col13, _col17, _col18 input vertices: 1 Map 11 - Statistics: Num rows: 9604070077 Data size: 4981069864848 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 4948870316218 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -448,20 +448,20 @@ STAGE PLANS: outputColumnNames: _col4, _col9, _col10, _col13, _col17, _col18, _col21, _col22, _col23, _col24, _col25 input vertices: 1 Map 14 - Statistics: Num rows: 9604070077 Data size: 8563387868485 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 8510115712201 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col4) keys: _col9 (type: char(20)), _col10 (type: char(30)), _col13 (type: char(2)), _col17 (type: varchar(50)), _col18 (type: char(2)), _col21 (type: decimal(7,2)), _col22 (type: char(20)), _col23 (type: char(20)), _col24 (type: char(10)), _col25 (type: int) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 9604070077 Data size: 8960597246757 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 8907325090473 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: char(2)), _col3 (type: varchar(50)), _col4 (type: char(2)), _col5 (type: decimal(7,2)), _col6 (type: char(20)), _col7 (type: char(20)), _col8 (type: char(10)), _col9 (type: int) null sort order: zzzzzzzzzz sort order: ++++++++++ Map-reduce partition columns: _col0 (type: char(20)), _col1 (type: char(30)), _col2 (type: char(2)), _col3 (type: varchar(50)), _col4 (type: char(2)), _col5 (type: decimal(7,2)), _col6 (type: char(20)), _col7 (type: char(20)), _col8 (type: char(10)), _col9 (type: int) - Statistics: Num rows: 9604070077 Data size: 8960597246757 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 8907325090473 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col10 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -471,11 +471,11 @@ STAGE PLANS: keys: KEY._col0 (type: char(20)), KEY._col1 (type: char(30)), KEY._col2 (type: char(2)), KEY._col3 (type: varchar(50)), KEY._col4 (type: char(2)), KEY._col5 (type: decimal(7,2)), KEY._col6 (type: char(20)), KEY._col7 (type: char(20)), KEY._col8 (type: char(10)), KEY._col9 (type: int) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 9604070077 Data size: 8960597246757 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 8907325090473 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col10 (type: decimal(17,2)) outputColumnNames: _col10 - Statistics: Num rows: 9604070077 Data size: 8960597246757 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9547575979 Data size: 8907325090473 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col10), count(_col10) minReductionHashAggr: 0.99 @@ -511,17 +511,17 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4 input vertices: 0 Reducer 4 - Statistics: Num rows: 36 Data size: 17712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 49 Data size: 24108 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col3 > _col4) (type: boolean) - Statistics: Num rows: 12 Data size: 5904 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16 Data size: 7872 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: varchar(50)), _col3 (type: decimal(27,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 12 Data size: 4560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16 Data size: 6080 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 12 Data size: 4560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16 Data size: 6080 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query25.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query25.q.out index eee452d8a295..9bb83417b1c1 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query25.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query25.q.out @@ -54,17 +54,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_id (type: string), s_store_name (type: varchar(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -72,17 +72,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -325,7 +325,7 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col9, _col15, _col19, _col20 input vertices: 1 Map 11 - Statistics: Num rows: 1178531569624 Data size: 626812675956880 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 626812675956000 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -335,12 +335,12 @@ STAGE PLANS: outputColumnNames: _col2, _col9, _col15, _col19, _col20, _col22, _col23 input vertices: 1 Map 12 - Statistics: Num rows: 1178531569624 Data size: 952087389173104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952087388959336 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++++ keys: _col22 (type: string), _col23 (type: varchar(200)), _col19 (type: string), _col20 (type: varchar(50)) null sort order: zzzz - Statistics: Num rows: 1178531569624 Data size: 952087389173104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952087388959336 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: sum(_col9), sum(_col15), sum(_col2) @@ -348,13 +348,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1178531569624 Data size: 952253508256192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952253507828384 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: string), _col3 (type: varchar(50)) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: string), _col3 (type: varchar(50)) - Statistics: Num rows: 1178531569624 Data size: 952253508256192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952253507828384 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -364,12 +364,12 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: varchar(200)), KEY._col2 (type: string), KEY._col3 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1178531569624 Data size: 952253508256192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952253507828384 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: string), _col3 (type: varchar(50)) null sort order: zzzz sort order: ++++ - Statistics: Num rows: 1178531569624 Data size: 952253508256192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952253507828384 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -377,7 +377,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: varchar(200)), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: varchar(50)), VALUE._col0 (type: decimal(17,2)), VALUE._col1 (type: decimal(17,2)), VALUE._col2 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1178531569624 Data size: 952253508256192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531569624 Data size: 952253507828384 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 80800 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query26.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query26.q.out index ddb99d5646ce..d09200a77321 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query26.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query26.q.out @@ -17,7 +17,7 @@ STAGE PLANS: TableScan alias: catalog_sales filterExpr: (cs_promo_sk is not null and cs_bill_cdemo_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_94_container, bigKeyColName:cs_bill_cdemo_sk, smallTablePos:1, keyRatio:0.0028366486625829453 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_98_container, bigKeyColName:cs_promo_sk, smallTablePos:1, keyRatio:4.466448390779309E-5 Statistics: Num rows: 43005109025 Data size: 15959723945900 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (cs_promo_sk is not null and cs_bill_cdemo_sk is not null) (type: boolean) @@ -30,27 +30,27 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col7 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 + outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6, _col7 input vertices: 1 Map 4 - Statistics: Num rows: 8539326845 Data size: 3070329057008 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 42790293199 Data size: 15538538783328 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: bigint) + 0 _col7 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col1, _col2, _col3, _col4, _col5, _col6 + outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6 input vertices: 1 Map 5 - Statistics: Num rows: 121990385 Data size: 6296772048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8539326845 Data size: 3002872415712 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col0 (type: bigint) 1 _col0 (type: bigint) outputColumnNames: _col1, _col3, _col4, _col5, _col6 input vertices: @@ -89,6 +89,27 @@ STAGE PLANS: Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 4 + Map Operator Tree: + TableScan + alias: promotion + filterExpr: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) + Statistics: Num rows: 2300 Data size: 405235 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) + Statistics: Num rows: 2300 Data size: 405235 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: p_promo_sk (type: bigint) + outputColumnNames: _col0 + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE + Execution mode: vectorized, llap + LLAP IO: may be used (ACID table) + Map 5 Map Operator Tree: TableScan alias: date_dim @@ -125,7 +146,7 @@ STAGE PLANS: Target Vertex: Map 1 Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 5 + Map 6 Map Operator Tree: TableScan alias: customer_demographics @@ -146,27 +167,6 @@ STAGE PLANS: Statistics: Num rows: 27440 Data size: 219520 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 6 - Map Operator Tree: - TableScan - alias: promotion - filterExpr: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) - Statistics: Num rows: 2300 Data size: 409400 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) - Statistics: Num rows: 2300 Data size: 409400 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: p_promo_sk (type: bigint) - outputColumnNames: _col0 - Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE - Execution mode: vectorized, llap - LLAP IO: may be used (ACID table) Map 7 Map Operator Tree: TableScan diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query27.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query27.q.out index 81f22c1653dc..85e8c31c9da5 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query27.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query27.q.out @@ -17,7 +17,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: (ss_cdemo_sk is not null and ss_store_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_96_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:2.1936500996451943E-9 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_96_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:2.2542481686961665E-9 Statistics: Num rows: 82510879939 Data size: 30001917572116 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ss_cdemo_sk is not null and ss_store_sk is not null) (type: boolean) @@ -55,7 +55,7 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5, _col6, _col11 input vertices: 1 Map 6 - Statistics: Num rows: 30788489 Data size: 2894118306 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 31584740 Data size: 2968965814 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -65,31 +65,31 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col6, _col11, _col13 input vertices: 1 Map 7 - Statistics: Num rows: 30788489 Data size: 5726659294 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 31584740 Data size: 5874761894 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col13 (type: string), _col11 (type: char(2)) null sort order: zz - Statistics: Num rows: 30788489 Data size: 5726659294 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 31584740 Data size: 5874761894 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col13 (type: string), _col11 (type: char(2)), _col3 (type: int), _col4 (type: decimal(7,2)), _col6 (type: decimal(7,2)), _col5 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 30788489 Data size: 5726659294 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 31584740 Data size: 5874761894 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2), count(_col2), sum(_col3), count(_col3), sum(_col4), count(_col4), sum(_col5), count(_col5) keys: _col0 (type: string), _col1 (type: char(2)), 0L (type: bigint) grouping sets: 0, 1, 3 - minReductionHashAggr: 0.98030734 + minReductionHashAggr: 0.97783417 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 46182733 Data size: 26324157810 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47377110 Data size: 27004952270 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: char(2)), _col2 (type: bigint) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: string), _col1 (type: char(2)), _col2 (type: bigint) - Statistics: Num rows: 46182733 Data size: 26324157810 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47377110 Data size: 27004952270 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint), _col5 (type: decimal(17,2)), _col6 (type: bigint), _col7 (type: decimal(17,2)), _col8 (type: bigint), _col9 (type: decimal(17,2)), _col10 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -156,20 +156,20 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_state) IN ('FL', 'LA', 'MI', 'MO', 'SC', 'SD') (type: boolean) - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_state) IN ('FL', 'LA', 'MI', 'MO', 'SC', 'SD') (type: boolean) - Statistics: Num rows: 232 Data size: 21808 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 238 Data size: 22286 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 232 Data size: 21808 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 238 Data size: 22286 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 232 Data size: 21808 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 238 Data size: 22286 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -199,16 +199,16 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: char(2)), KEY._col2 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 4455432 Data size: 2539596240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5940576 Data size: 3386128320 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: string), _col1 (type: char(2)), grouping(_col2, 0L) (type: bigint), (UDFToDouble(_col3) / _col4) (type: double), CAST( (_col5 / _col6) AS decimal(11,6)) (type: decimal(11,6)), CAST( (_col7 / _col8) AS decimal(11,6)) (type: decimal(11,6)), CAST( (_col9 / _col10) AS decimal(11,6)) (type: decimal(11,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 4455432 Data size: 2397022416 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5940576 Data size: 3196029888 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: char(2)) null sort order: zz sort order: ++ - Statistics: Num rows: 4455432 Data size: 2397022416 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5940576 Data size: 3196029888 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint), _col3 (type: double), _col4 (type: decimal(11,6)), _col5 (type: decimal(11,6)), _col6 (type: decimal(11,6)) Reducer 3 Execution mode: vectorized, llap @@ -216,7 +216,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(2)), VALUE._col0 (type: bigint), VALUE._col1 (type: double), VALUE._col2 (type: decimal(11,6)), VALUE._col3 (type: decimal(11,6)), VALUE._col4 (type: decimal(11,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 4455432 Data size: 2397022416 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5940576 Data size: 3196029888 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 53800 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query29.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query29.q.out index c7bba5a19646..f94a108195a4 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query29.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query29.q.out @@ -54,17 +54,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_id (type: string), s_store_name (type: varchar(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -72,17 +72,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 134904000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 134691112 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -332,7 +332,7 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col9, _col15, _col19, _col20 input vertices: 1 Map 11 - Statistics: Num rows: 1178531672141 Data size: 245128218895444 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 245128218894564 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -342,12 +342,12 @@ STAGE PLANS: outputColumnNames: _col2, _col9, _col15, _col19, _col20, _col22, _col23 input vertices: 1 Map 12 - Statistics: Num rows: 1178531672141 Data size: 570402960406360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 570402960192592 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++++ keys: _col22 (type: string), _col23 (type: varchar(200)), _col19 (type: string), _col20 (type: varchar(50)) null sort order: zzzz - Statistics: Num rows: 1178531672141 Data size: 570402960406360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 570402960192592 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: sum(_col9), sum(_col15), sum(_col2) @@ -355,13 +355,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1178531672141 Data size: 584551709381936 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 584551708954128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: string), _col3 (type: varchar(50)) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: string), _col3 (type: varchar(50)) - Statistics: Num rows: 1178531672141 Data size: 584551709381936 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 584551708954128 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -371,12 +371,12 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: varchar(200)), KEY._col2 (type: string), KEY._col3 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1178531672141 Data size: 584551709381936 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 584551708954128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: varchar(200)), _col2 (type: string), _col3 (type: varchar(50)) null sort order: zzzz sort order: ++++ - Statistics: Num rows: 1178531672141 Data size: 584551709381936 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 584551708954128 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint) Reducer 6 Execution mode: vectorized, llap @@ -384,7 +384,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: varchar(200)), KEY.reducesinkkey2 (type: string), KEY.reducesinkkey3 (type: varchar(50)), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), VALUE._col2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 1178531672141 Data size: 584551709381936 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1178531672141 Data size: 584551708954128 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 49600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query3.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query3.q.out index 7d2b692eb471..6163bcb049aa 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query3.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query3.q.out @@ -54,13 +54,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 931320 Data size: 204890400 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 955200 Data size: 210144000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: char(50)) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: char(50)) - Statistics: Num rows: 931320 Data size: 204890400 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 955200 Data size: 210144000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -69,7 +69,7 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_manufact_id = 436) (type: boolean) - Statistics: Num rows: 462000 Data size: 53582844 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53467544 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manufact_id = 436) (type: boolean) Statistics: Num rows: 468 Data size: 54288 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query30.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query30.q.out index 39636685cd64..b0547db7fcc7 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query30.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query30.q.out @@ -23,15 +23,15 @@ STAGE PLANS: TableScan alias: customer filterExpr: c_current_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_159_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0185202875 - Statistics: Num rows: 80000000 Data size: 61944003308 Basic stats: COMPLETE Column stats: COMPLETE + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_159_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0188764625 + Statistics: Num rows: 80000000 Data size: 53670337766 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 61944003308 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 53670337766 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)), c_current_addr_sk (type: bigint), c_salutation (type: char(10)), c_first_name (type: char(20)), c_last_name (type: char(30)), c_preferred_cust_flag (type: char(1)), c_birth_day (type: int), c_birth_month (type: int), c_birth_year (type: int), c_birth_country (type: varchar(20)), c_login (type: char(13)), c_email_address (type: char(50)), c_last_review_date_sk (type: bigint) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string), c_current_addr_sk (type: bigint), c_salutation (type: char(10)), c_first_name (type: char(20)), c_last_name (type: char(30)), c_preferred_cust_flag (type: char(1)), c_birth_day (type: int), c_birth_month (type: int), c_birth_year (type: int), c_birth_country (type: varchar(20)), c_login (type: char(13)), c_email_address (type: char(50)), c_last_review_date_sk (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13 - Statistics: Num rows: 80000000 Data size: 61944003308 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 53670337766 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -41,20 +41,20 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13 input vertices: 1 Map 3 - Statistics: Num rows: 1509434 Data size: 1127547218 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1538463 Data size: 166154663 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1509434 Data size: 1127547218 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col6 (type: char(1)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: varchar(20)), _col11 (type: char(13)), _col12 (type: char(50)), _col13 (type: bigint) + Statistics: Num rows: 1538463 Data size: 166154663 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col6 (type: char(1)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: varchar(20)), _col11 (type: char(13)), _col12 (type: char(50)), _col13 (type: bigint) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 1509434 Data size: 12075472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1538463 Data size: 12307704 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1481623) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1510117) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 @@ -130,41 +130,41 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_state is not null or (ca_state = 'IL')) (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ca_state is not null (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Filter Operator predicate: (ca_state = 'IL') (type: boolean) - Statistics: Num rows: 754717 Data size: 70943398 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 70323608 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 5 @@ -199,20 +199,20 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col6 input vertices: 1 Map 3 - Statistics: Num rows: 338617340 Data size: 64060966704 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 328460848 Data size: 61868644960 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col6 (type: char(2)), _col0 (type: bigint) minReductionHashAggr: 0.71617645 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 338617340 Data size: 69375636960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 328460848 Data size: 67183315216 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: char(2)), _col1 (type: bigint) - Statistics: Num rows: 338617340 Data size: 69375636960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 328460848 Data size: 67183315216 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)) Filter Operator predicate: (wr_returning_addr_sk is not null and wr_returning_customer_sk is not null and wr_returning_customer_sk BETWEEN DynamicValue(RS_57_customer_c_customer_sk_min) AND DynamicValue(RS_57_customer_c_customer_sk_max) and in_bloom_filter(wr_returning_customer_sk, DynamicValue(RS_57_customer_c_customer_sk_bloom_filter))) (type: boolean) @@ -240,20 +240,20 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col6 input vertices: 1 Reducer 4 - Statistics: Num rows: 330641649 Data size: 62552093862 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 320724380 Data size: 60409052056 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col0 (type: bigint), _col6 (type: char(2)) minReductionHashAggr: 0.7093301 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 330641649 Data size: 67741584070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 320724380 Data size: 65598542264 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: char(2)) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: char(2)) - Statistics: Num rows: 330641649 Data size: 67741584070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 320724380 Data size: 65598542264 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -273,7 +273,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1481623) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1510117) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE @@ -293,7 +293,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Reducer 6 Execution mode: vectorized, llap @@ -303,24 +303,24 @@ STAGE PLANS: keys: KEY._col0 (type: char(2)), KEY._col1 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 338617340 Data size: 69375636960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 328460848 Data size: 67183315216 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(2)), _col2 (type: decimal(17,2)) outputColumnNames: _col0, _col2 - Statistics: Num rows: 338617340 Data size: 69375636960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 328460848 Data size: 67183315216 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2), count(_col2) keys: _col0 (type: char(2)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 14363 Data size: 2958778 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13939 Data size: 2867306 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(2)) - Statistics: Num rows: 14363 Data size: 2958778 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13939 Data size: 2867306 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)), _col2 (type: bigint) Reducer 7 Execution mode: vectorized, llap @@ -353,10 +353,10 @@ STAGE PLANS: keys: KEY._col0 (type: bigint), KEY._col1 (type: char(2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 330641649 Data size: 67741584070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 320724380 Data size: 65598542264 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 is not null (type: boolean) - Statistics: Num rows: 330641649 Data size: 67741584070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 320724380 Data size: 65598542264 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -366,7 +366,7 @@ STAGE PLANS: outputColumnNames: _col1, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col16, _col17 input vertices: 0 Map 1 - Statistics: Num rows: 330641649 Data size: 316393869433 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 320724380 Data size: 305819300810 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -376,32 +376,32 @@ STAGE PLANS: outputColumnNames: _col1, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col17, _col18 input vertices: 1 Reducer 7 - Statistics: Num rows: 330641649 Data size: 324990552307 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 326892156 Data size: 320321142890 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col17 > _col18) (type: boolean) - Statistics: Num rows: 110213883 Data size: 108330184109 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 108964052 Data size: 106773714736 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++++++++++ - keys: _col1 (type: char(16)), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col6 (type: char(1)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: varchar(20)), _col11 (type: char(13)), _col12 (type: char(50)), _col13 (type: bigint), _col17 (type: decimal(17,2)) + keys: _col1 (type: string), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col6 (type: char(1)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: varchar(20)), _col11 (type: char(13)), _col12 (type: char(50)), _col13 (type: bigint), _col17 (type: decimal(17,2)) null sort order: zzzzzzzzzzzzz - Statistics: Num rows: 110213883 Data size: 108330184109 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 108964052 Data size: 106773714736 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator - expressions: _col1 (type: char(16)), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col6 (type: char(1)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: varchar(20)), _col11 (type: char(13)), _col12 (type: char(50)), _col13 (type: bigint), _col17 (type: decimal(17,2)) + expressions: _col1 (type: string), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col6 (type: char(1)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: varchar(20)), _col11 (type: char(13)), _col12 (type: char(50)), _col13 (type: bigint), _col17 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12 - Statistics: Num rows: 110213883 Data size: 95976166313 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 108964052 Data size: 94231791873 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: char(10)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: char(1)), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col8 (type: varchar(20)), _col9 (type: char(13)), _col10 (type: char(50)), _col11 (type: bigint), _col12 (type: decimal(17,2)) + key expressions: _col0 (type: string), _col1 (type: char(10)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: char(1)), _col5 (type: int), _col6 (type: int), _col7 (type: int), _col8 (type: varchar(20)), _col9 (type: char(13)), _col10 (type: char(50)), _col11 (type: bigint), _col12 (type: decimal(17,2)) null sort order: zzzzzzzzzzzzz sort order: +++++++++++++ - Statistics: Num rows: 110213883 Data size: 95976166313 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 108964052 Data size: 94231791873 Basic stats: COMPLETE Column stats: COMPLETE Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)), KEY.reducesinkkey1 (type: char(10)), KEY.reducesinkkey2 (type: char(20)), KEY.reducesinkkey3 (type: char(30)), KEY.reducesinkkey4 (type: char(1)), KEY.reducesinkkey5 (type: int), KEY.reducesinkkey6 (type: int), KEY.reducesinkkey7 (type: int), KEY.reducesinkkey8 (type: varchar(20)), KEY.reducesinkkey9 (type: char(13)), KEY.reducesinkkey10 (type: char(50)), KEY.reducesinkkey11 (type: bigint), KEY.reducesinkkey12 (type: decimal(17,2)) + expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(10)), KEY.reducesinkkey2 (type: char(20)), KEY.reducesinkkey3 (type: char(30)), KEY.reducesinkkey4 (type: char(1)), KEY.reducesinkkey5 (type: int), KEY.reducesinkkey6 (type: int), KEY.reducesinkkey7 (type: int), KEY.reducesinkkey8 (type: varchar(20)), KEY.reducesinkkey9 (type: char(13)), KEY.reducesinkkey10 (type: char(50)), KEY.reducesinkkey11 (type: bigint), KEY.reducesinkkey12 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12 - Statistics: Num rows: 110213883 Data size: 95976166313 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 108964052 Data size: 94231791873 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 87100 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query31.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query31.q.out index 112185cad005..0294c54ad92b 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query31.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query31.q.out @@ -26,7 +26,7 @@ STAGE PLANS: TableScan alias: web_sales filterExpr: ws_bill_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_393_container, bigKeyColName:ws_bill_addr_sk, smallTablePos:1, keyRatio:0.05037635576628538 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_393_container, bigKeyColName:ws_bill_addr_sk, smallTablePos:1, keyRatio:0.04886735157149479 Statistics: Num rows: 21594638446 Data size: 2763789503808 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ws_bill_addr_sk is not null (type: boolean) @@ -54,20 +54,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 1087859189 Data size: 228147860010 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1055272789 Data size: 221190811296 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 1721560 Data size: 361527600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1668585 Data size: 350222824 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1721560 Data size: 361527600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1668585 Data size: 350222824 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -76,7 +76,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_401_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:0.049193881825049336 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_401_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:0.047720298170507186 Statistics: Num rows: 82510879939 Data size: 10327822006760 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_addr_sk is not null (type: boolean) @@ -104,20 +104,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 4059030477 Data size: 639544095946 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3937443793 Data size: 613896987592 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 4823070 Data size: 1012844700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4627671 Data size: 971677140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 4823070 Data size: 1012844700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4627671 Data size: 971677140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -126,7 +126,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_403_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:0.049193881825049336 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_403_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:0.047720298170507186 Statistics: Num rows: 82510879939 Data size: 10327822006760 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_addr_sk is not null (type: boolean) @@ -154,20 +154,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 4059030477 Data size: 639544095946 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3937443793 Data size: 613896987592 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 4823070 Data size: 1012844700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4627671 Data size: 971677140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 4823070 Data size: 1012844700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4627671 Data size: 971677140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -176,7 +176,7 @@ STAGE PLANS: TableScan alias: web_sales filterExpr: ws_bill_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_395_container, bigKeyColName:ws_bill_addr_sk, smallTablePos:1, keyRatio:0.05037635576628538 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_395_container, bigKeyColName:ws_bill_addr_sk, smallTablePos:1, keyRatio:0.04886735157149479 Statistics: Num rows: 21594638446 Data size: 2763789503808 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ws_bill_addr_sk is not null (type: boolean) @@ -204,20 +204,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 1087859189 Data size: 228147860010 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1055272789 Data size: 221190811296 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 1721560 Data size: 361527600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1668585 Data size: 350222824 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1721560 Data size: 361527600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1668585 Data size: 350222824 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -357,55 +357,55 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: ca_county is not null (type: boolean) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 4122577968 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ca_county is not null (type: boolean) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_county (type: varchar(30)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4240000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38801815 Data size: 3999087676 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -414,7 +414,7 @@ STAGE PLANS: TableScan alias: web_sales filterExpr: ws_bill_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_397_container, bigKeyColName:ws_bill_addr_sk, smallTablePos:1, keyRatio:0.05037635576628538 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_397_container, bigKeyColName:ws_bill_addr_sk, smallTablePos:1, keyRatio:0.04886735157149479 Statistics: Num rows: 21594638446 Data size: 2763789503808 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ws_bill_addr_sk is not null (type: boolean) @@ -442,20 +442,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 1087859189 Data size: 228147860010 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1055272789 Data size: 221190811296 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 1721560 Data size: 361527600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1668585 Data size: 350222824 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1721560 Data size: 361527600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1668585 Data size: 350222824 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -464,7 +464,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_399_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:0.049193881825049336 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_399_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:0.047720298170507186 Statistics: Num rows: 82510879939 Data size: 10327822006760 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_addr_sk is not null (type: boolean) @@ -492,20 +492,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 4059030477 Data size: 639544095946 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3937443793 Data size: 613896987592 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 4823070 Data size: 1012844700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4627671 Data size: 971677140 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 4823070 Data size: 1012844700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4627671 Data size: 971677140 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -517,7 +517,7 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 405090 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -537,7 +537,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col5 input vertices: 1 Reducer 14 - Statistics: Num rows: 1930 Data size: 837620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1931 Data size: 838054 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -547,17 +547,17 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col4, _col6, _col7, _col8, _col9, _col11, _col13 input vertices: 0 Reducer 2 - Statistics: Num rows: 1930 Data size: 1501540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1934 Data size: 1504652 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (if((_col9 > 0), if(_col7, ((_col4 / _col6) > (_col13 / _col9)), false), false) and if((_col11 > 0), if(_col2, ((_col6 / _col1) > (_col9 / _col11)), false), false)) (type: boolean) - Statistics: Num rows: 482 Data size: 374996 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 483 Data size: 375774 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col8 (type: varchar(30)), 2000 (type: int), (_col6 / _col1) (type: decimal(37,20)), (_col9 / _col11) (type: decimal(37,20)), (_col4 / _col6) (type: decimal(37,20)), (_col13 / _col9) (type: decimal(37,20)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 482 Data size: 265100 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 483 Data size: 265650 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 482 Data size: 265100 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 483 Data size: 265650 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -570,13 +570,13 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 405090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 405090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 14 Execution mode: vectorized, llap @@ -586,13 +586,13 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 405090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 405090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 2 Execution mode: vectorized, llap @@ -602,11 +602,11 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 404992 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: varchar(30)), _col1 (type: decimal(17,2)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1930 Data size: 413020 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 412708 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -616,7 +616,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col4 input vertices: 1 Reducer 4 - Statistics: Num rows: 1930 Data size: 629180 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1930 Data size: 629082 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -626,13 +626,13 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col4, _col6, _col7 input vertices: 1 Reducer 8 - Statistics: Num rows: 1930 Data size: 853060 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1931 Data size: 853404 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1930 Data size: 853060 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1931 Data size: 853404 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: boolean), _col4 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: boolean) Reducer 4 Execution mode: vectorized, llap @@ -642,13 +642,13 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 404992 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 404992 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 8 Execution mode: vectorized, llap @@ -658,17 +658,17 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1930 Data size: 405300 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 404992 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: varchar(30)), _col1 (type: decimal(17,2)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1930 Data size: 413020 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 412708 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: varchar(30)) - Statistics: Num rows: 1930 Data size: 413020 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1929 Data size: 412708 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: boolean) Stage: Stage-0 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query33.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query33.q.out index bec4c53aab72..19abe6c0ea82 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query33.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query33.q.out @@ -349,17 +349,17 @@ STAGE PLANS: TableScan alias: item filterExpr: (((i_category = 'Books ') and i_manufact_id is not null) or i_manufact_id is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 43423396 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 43323316 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((i_category = 'Books ') and i_manufact_id is not null) (type: boolean) - Statistics: Num rows: 41895 Data size: 3937718 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46085 Data size: 4321634 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_manufact_id (type: int) outputColumnNames: _col0 - Statistics: Num rows: 41895 Data size: 167168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46085 Data size: 183884 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int) - minReductionHashAggr: 0.97641724 + minReductionHashAggr: 0.97856134 mode: hash outputColumnNames: _col0 Statistics: Num rows: 988 Data size: 3948 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query34.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query34.q.out index 3bd4b54e6623..6b1154df450b 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query34.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query34.q.out @@ -18,11 +18,11 @@ STAGE PLANS: TableScan alias: customer probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_92_container, bigKeyColName:c_customer_sk, smallTablePos:1, keyRatio:1.25E-8 - Statistics: Num rows: 80000000 Data size: 28800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 27814510494 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_salutation (type: char(10)), c_first_name (type: char(20)), c_last_name (type: char(30)), c_preferred_cust_flag (type: char(1)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 80000000 Data size: 28800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 27814510494 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -32,16 +32,16 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col4, _col5, _col7 input vertices: 1 Reducer 4 - Statistics: Num rows: 6 Data size: 2208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6 Data size: 448 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: char(30)), _col2 (type: char(20)), _col1 (type: char(10)), _col4 (type: char(1)), _col5 (type: bigint), _col7 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6 Data size: 2208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6 Data size: 448 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: char(10)), _col3 (type: char(1)) null sort order: zzza sort order: +++- - Statistics: Num rows: 6 Data size: 2208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6 Data size: 448 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: bigint), _col5 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -168,7 +168,7 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_county) IN ('Barrow County', 'Fairfield County', 'Huron County', 'Jackson County', 'Kittitas County', 'Maverick County', 'Mobile County', 'Pennington County') (type: boolean) - Statistics: Num rows: 1704 Data size: 180624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 179546 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_county) IN ('Barrow County', 'Fairfield County', 'Huron County', 'Jackson County', 'Kittitas County', 'Maverick County', 'Mobile County', 'Pennington County') (type: boolean) Statistics: Num rows: 107 Data size: 11342 Basic stats: COMPLETE Column stats: COMPLETE @@ -190,10 +190,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(30)), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: char(10)), KEY.reducesinkkey3 (type: char(1)), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6 Data size: 2208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6 Data size: 448 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 6 Data size: 2208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6 Data size: 448 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query35.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query35.q.out index c78475a0d3e5..671beb725a34 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query35.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query35.q.out @@ -158,17 +158,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: ca - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -357,13 +357,13 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col4, _col5, _col14 input vertices: 1 Map 13 - Statistics: Num rows: 15670819 Data size: 4199779492 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15670819 Data size: 4096600390 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Top N Key Operator sort order: ++++++ keys: _col14 (type: char(2)), _col1 (type: char(1)), _col2 (type: char(1)), _col3 (type: int), _col4 (type: int), _col5 (type: int) null sort order: zzzzzz - Statistics: Num rows: 15670819 Data size: 4199779492 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15670819 Data size: 4096600390 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: count(), sum(_col3), count(_col3), max(_col3), sum(_col4), count(_col4), max(_col4), sum(_col5), count(_col5), max(_col5) @@ -371,13 +371,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15 - Statistics: Num rows: 1224510 Data size: 411435360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1282820 Data size: 414135056 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)), _col1 (type: char(1)), _col2 (type: char(1)), _col3 (type: int), _col4 (type: int), _col5 (type: int) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: char(2)), _col1 (type: char(1)), _col2 (type: char(1)), _col3 (type: int), _col4 (type: int), _col5 (type: int) - Statistics: Num rows: 1224510 Data size: 411435360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1282820 Data size: 414135056 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col6 (type: bigint), _col7 (type: bigint), _col8 (type: bigint), _col9 (type: int), _col10 (type: bigint), _col11 (type: bigint), _col12 (type: int), _col13 (type: bigint), _col14 (type: bigint), _col15 (type: int) Reducer 5 Execution mode: vectorized, llap @@ -387,16 +387,16 @@ STAGE PLANS: keys: KEY._col0 (type: char(2)), KEY._col1 (type: char(1)), KEY._col2 (type: char(1)), KEY._col3 (type: int), KEY._col4 (type: int), KEY._col5 (type: int) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15 - Statistics: Num rows: 72030 Data size: 24202080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 75460 Data size: 24361002 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(2)), _col1 (type: char(1)), _col2 (type: char(1)), _col6 (type: bigint), (UDFToDouble(_col7) / _col8) (type: double), _col9 (type: int), _col7 (type: bigint), _col4 (type: int), (UDFToDouble(_col10) / _col11) (type: double), _col12 (type: int), _col10 (type: bigint), _col5 (type: int), (UDFToDouble(_col13) / _col14) (type: double), _col15 (type: int), _col13 (type: bigint), _col3 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col9, _col10, _col11, _col12, _col14, _col15, _col16, _col17 - Statistics: Num rows: 72030 Data size: 24202080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 75460 Data size: 24361002 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)), _col1 (type: char(1)), _col2 (type: char(1)), _col17 (type: int), _col7 (type: int), _col12 (type: int) null sort order: zzzzzz sort order: ++++++ - Statistics: Num rows: 72030 Data size: 24202080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 75460 Data size: 24361002 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: double), _col5 (type: int), _col6 (type: bigint), _col9 (type: double), _col10 (type: int), _col11 (type: bigint), _col14 (type: double), _col15 (type: int), _col16 (type: bigint) Reducer 6 Execution mode: vectorized, llap @@ -404,13 +404,13 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(2)), KEY.reducesinkkey1 (type: char(1)), KEY.reducesinkkey2 (type: char(1)), VALUE._col0 (type: bigint), VALUE._col1 (type: double), VALUE._col2 (type: int), VALUE._col3 (type: bigint), KEY.reducesinkkey4 (type: int), VALUE._col0 (type: bigint), VALUE._col4 (type: double), VALUE._col5 (type: int), VALUE._col6 (type: bigint), KEY.reducesinkkey5 (type: int), VALUE._col0 (type: bigint), VALUE._col7 (type: double), VALUE._col8 (type: int), VALUE._col9 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16 - Statistics: Num rows: 72030 Data size: 25066440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 75460 Data size: 25266522 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 34800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 33596 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 34800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 33596 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query36.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query36.q.out index 8b144f96242b..3bc7ad8e2642 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query36.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query36.q.out @@ -18,7 +18,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_store_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_74_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:2.049790283718186E-7 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_74_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:2.096087208473129E-7 Statistics: Num rows: 82510879939 Data size: 20011209733336 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_store_sk is not null (type: boolean) @@ -46,7 +46,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3 input vertices: 1 Map 6 - Statistics: Num rows: 2949381825 Data size: 258560072776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3015980781 Data size: 274011030568 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -56,11 +56,11 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col8, _col9 input vertices: 1 Map 7 - Statistics: Num rows: 2949381825 Data size: 771752510326 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3015980781 Data size: 798791480122 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col9 (type: char(50)), _col8 (type: char(50)), _col3 (type: decimal(7,2)), _col2 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 2949381825 Data size: 771752510326 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3015980781 Data size: 798791480122 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2), sum(_col3) keys: _col0 (type: char(50)), _col1 (type: char(50)), 0L (type: bigint) @@ -68,13 +68,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 9850005 Data size: 4077902070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10093314 Data size: 4178631450 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: bigint) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: bigint) - Statistics: Num rows: 9850005 Data size: 4077902070 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10093314 Data size: 4178631450 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -120,37 +120,37 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_state) IN ('AL', 'FL', 'GA', 'LA', 'MI', 'MO', 'SC', 'SD') (type: boolean) - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 159230 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_state) IN ('AL', 'FL', 'GA', 'LA', 'MI', 'MO', 'SC', 'SD') (type: boolean) - Statistics: Num rows: 310 Data size: 29140 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 317 Data size: 29712 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 310 Data size: 2480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 317 Data size: 2536 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 310 Data size: 2480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 317 Data size: 2536 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 7 Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_class (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -162,17 +162,17 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 3267 Data size: 1352538 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 1338876 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 3267 Data size: 1352538 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 1338876 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: (grouping(_col4, 1L) + grouping(_col4, 0L)) (type: bigint), CASE WHEN ((grouping(_col4, 0L) = UDFToLong(0))) THEN (_col0) ELSE (CAST( null AS CHAR(50))) END (type: char(50)), (_col2 / _col3) (type: decimal(37,20)) null sort order: aaz sort order: +++ Map-reduce partition columns: (grouping(_col4, 1L) + grouping(_col4, 0L)) (type: bigint), CASE WHEN ((grouping(_col4, 0L) = UDFToLong(0))) THEN (_col0) ELSE (CAST( null AS CHAR(50))) END (type: char(50)) - Statistics: Num rows: 3267 Data size: 1352538 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 1338876 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col4 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -180,7 +180,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), VALUE._col1 (type: char(50)), VALUE._col2 (type: decimal(17,2)), VALUE._col3 (type: decimal(17,2)), VALUE._col4 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 3267 Data size: 1352538 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 1338876 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -201,22 +201,22 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 3267 Data size: 1352538 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 1338876 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: -++ keys: (grouping(_col4, 1L) + grouping(_col4, 0L)) (type: bigint), if(((grouping(_col4, 1L) + grouping(_col4, 0L)) = 0L), _col0, null) (type: char(50)), rank_window_0 (type: int) null sort order: azz - Statistics: Num rows: 3267 Data size: 1352538 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 1338876 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: (_col2 / _col3) (type: decimal(37,20)), _col0 (type: char(50)), _col1 (type: char(50)), (grouping(_col4, 1L) + grouping(_col4, 0L)) (type: bigint), rank_window_0 (type: int), if(((grouping(_col4, 1L) + grouping(_col4, 0L)) = 0L), _col0, null) (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 3267 Data size: 999792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 989694 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: bigint), _col5 (type: char(50)), _col4 (type: int) null sort order: azz sort order: -++ - Statistics: Num rows: 3267 Data size: 999792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 989694 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: decimal(37,20)), _col1 (type: char(50)), _col2 (type: char(50)) Reducer 4 Execution mode: vectorized, llap @@ -224,7 +224,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: decimal(37,20)), VALUE._col1 (type: char(50)), VALUE._col2 (type: char(50)), KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey2 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 3267 Data size: 999702 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 989604 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 30600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query37.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query37.q.out index b37ba649551d..2a8c636dd2bc 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query37.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query37.q.out @@ -37,7 +37,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col4, _col5 input vertices: 1 Map 2 - Statistics: Num rows: 1203452 Data size: 495822112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1203452 Data size: 495821928 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -47,13 +47,13 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col4, _col5 input vertices: 1 Map 4 - Statistics: Num rows: 133708 Data size: 54017920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133708 Data size: 54017736 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col2 (type: bigint) - Statistics: Num rows: 133708 Data size: 54017920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133708 Data size: 54017736 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: string), _col4 (type: varchar(200)), _col5 (type: decimal(7,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -62,20 +62,20 @@ STAGE PLANS: TableScan alias: item filterExpr: ((i_manufact_id) IN (678, 849, 918, 964) and i_current_price BETWEEN 22 AND 52) (type: boolean) - Statistics: Num rows: 462000 Data size: 188360804 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 188147916 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((i_manufact_id) IN (678, 849, 918, 964) and i_current_price BETWEEN 22 AND 52) (type: boolean) - Statistics: Num rows: 759 Data size: 309556 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 759 Data size: 309372 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)), i_current_price (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 759 Data size: 306524 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 759 Data size: 306340 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 759 Data size: 306524 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 759 Data size: 306340 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)), _col3 (type: decimal(7,2)) Select Operator expressions: _col0 (type: bigint) @@ -138,12 +138,12 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5 input vertices: 0 Map 1 - Statistics: Num rows: 71005705 Data size: 28118259068 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 71005705 Data size: 28118258884 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++ keys: _col3 (type: string), _col4 (type: varchar(200)), _col5 (type: decimal(7,2)) null sort order: zzz - Statistics: Num rows: 71005705 Data size: 28118259068 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 71005705 Data size: 28118258884 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator keys: _col3 (type: string), _col4 (type: varchar(200)), _col5 (type: decimal(7,2)) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query38.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query38.q.out index 9a35919c5a20..827b1d803f45 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query38.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query38.q.out @@ -172,31 +172,31 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -244,20 +244,20 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6 input vertices: 1 Map 14 - Statistics: Num rows: 4245017503 Data size: 1001824130708 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4245017503 Data size: 1001320399808 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator keys: _col6 (type: char(30)), _col5 (type: char(20)), _col3 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2122508751 Data size: 500912065236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2122508751 Data size: 500660199966 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 2122508751 Data size: 500912065236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2122508751 Data size: 500660199966 Basic stats: COMPLETE Column stats: COMPLETE Reducer 13 Execution mode: vectorized, llap Reduce Operator Tree: @@ -265,30 +265,30 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1061254375 Data size: 250456032500 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1061254375 Data size: 250330100000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(20)), _col0 (type: char(30)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1061254375 Data size: 250456032500 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1061254375 Data size: 250330100000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 265313593 Data size: 64736516692 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 265313593 Data size: 64705033792 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col3) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 889341640 Data size: 216999360160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 889341640 Data size: 216936394090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 889341640 Data size: 216999360160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 889341640 Data size: 216936394090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint) Reducer 2 Execution mode: vectorized, llap @@ -302,20 +302,20 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6 input vertices: 1 Map 14 - Statistics: Num rows: 15839433273 Data size: 3738106252428 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15839433273 Data size: 3737602521528 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator keys: _col6 (type: char(30)), _col5 (type: char(20)), _col3 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 7919716636 Data size: 1869053126096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7919716636 Data size: 1868801260826 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 7919716636 Data size: 1869053126096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7919716636 Data size: 1868801260826 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: @@ -323,30 +323,30 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 3959858318 Data size: 934526563048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3959858318 Data size: 934400630458 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(20)), _col0 (type: char(30)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 3959858318 Data size: 934526563048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3959858318 Data size: 934400630458 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 989964579 Data size: 241551357276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 989964579 Data size: 241519874286 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col3) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 889341640 Data size: 216999360160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 889341640 Data size: 216936394090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 889341640 Data size: 216999360160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 889341640 Data size: 216936394090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -356,7 +356,7 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 444670820 Data size: 108499680080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 444670820 Data size: 108468197090 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: bigint) outputColumnNames: _col3 @@ -404,20 +404,20 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6 input vertices: 1 Map 14 - Statistics: Num rows: 8374481746 Data size: 1976377692056 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8374481746 Data size: 1975873961156 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator keys: _col6 (type: char(30)), _col5 (type: char(20)), _col3 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4187240873 Data size: 988188846028 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4187240873 Data size: 987936980578 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 4187240873 Data size: 988188846028 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4187240873 Data size: 987936980578 Basic stats: COMPLETE Column stats: COMPLETE Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: @@ -425,30 +425,30 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2093620436 Data size: 494094422896 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2093620436 Data size: 493968490306 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(20)), _col0 (type: char(30)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2093620436 Data size: 494094422896 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2093620436 Data size: 493968490306 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 523405109 Data size: 127710846596 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 523405109 Data size: 127679363516 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col3) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 889341640 Data size: 216999360160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 889341640 Data size: 216936394090 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 889341640 Data size: 216999360160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 889341640 Data size: 216936394090 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint) Union 4 Vertex: Union 4 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query4.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query4.q.out index 5ae35bed4722..038a5266cdfb 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query4.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query4.q.out @@ -144,7 +144,7 @@ STAGE PLANS: alias: customer Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator @@ -153,46 +153,46 @@ STAGE PLANS: sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)), c_birth_country (type: varchar(20)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string), c_birth_country (type: varchar(20)) outputColumnNames: _col0, _col1, _col4 - Statistics: Num rows: 80000000 Data size: 16000000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15742561276 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 16000000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)), _col4 (type: varchar(20)) + Statistics: Num rows: 80000000 Data size: 15742561276 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string), _col4 (type: varchar(20)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 17 @@ -430,36 +430,36 @@ STAGE PLANS: TableScan alias: customer probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_486_container, bigKeyColName:c_customer_id, smallTablePos:0, keyRatio:0.083333325 - Statistics: Num rows: 80000000 Data size: 29760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 28998830376 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_id (type: char(16)), c_first_name (type: char(20)), c_last_name (type: char(30)), c_birth_country (type: varchar(20)) + expressions: c_customer_id (type: string), c_first_name (type: char(20)), c_last_name (type: char(30)), c_birth_country (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 29760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 28998830376 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: char(16)) - 1 _col0 (type: char(16)) + 0 _col0 (type: string) + 1 _col0 (type: string) outputColumnNames: _col0, _col2, _col3, _col4 input vertices: 0 Reducer 8 - Statistics: Num rows: 6666666 Data size: 2479999752 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6666666 Data size: 1718830128 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++++ - keys: _col0 (type: char(16)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) + keys: _col0 (type: string), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) null sort order: zzzz - Statistics: Num rows: 6666666 Data size: 2479999752 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6666666 Data size: 1718830128 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator - expressions: _col0 (type: char(16)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) + expressions: _col0 (type: string), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 6666666 Data size: 2479999752 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6666666 Data size: 957660232 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: varchar(20)) + key expressions: _col0 (type: string), _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: varchar(20)) null sort order: zzzz sort order: ++++ - Statistics: Num rows: 6666666 Data size: 2479999752 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6666666 Data size: 957660232 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 10 @@ -467,7 +467,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -475,14 +475,14 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 26666666 Data size: 5653333192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(24,6)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(24,6)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)), _col2 (type: boolean) Reducer 12 @@ -501,16 +501,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) Reducer 13 @@ -518,15 +518,15 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) Reducer 14 @@ -545,16 +545,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) Reducer 15 @@ -562,7 +562,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -570,14 +570,14 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 26666666 Data size: 5653333192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(24,6)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(24,6)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)), _col2 (type: boolean) Reducer 18 @@ -596,16 +596,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.9815675 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) Reducer 19 @@ -613,15 +613,15 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) Reducer 2 @@ -636,21 +636,21 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col8 input vertices: 1 Map 16 - Statistics: Num rows: 16584098707 Data size: 5041566006928 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16584098707 Data size: 5041308568204 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)), _col8 (type: varchar(20)) - minReductionHashAggr: 0.9291035 + keys: _col5 (type: string), _col8 (type: varchar(20)) + minReductionHashAggr: 0.92926776 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 24320000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 24318758276 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: varchar(20)) + key expressions: _col0 (type: string), _col1 (type: varchar(20)) null sort order: zz sort order: ++ - Map-reduce partition columns: _col0 (type: char(16)), _col1 (type: varchar(20)) - Statistics: Num rows: 80000000 Data size: 24320000000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: string), _col1 (type: varchar(20)) + Statistics: Num rows: 80000000 Data size: 24318758276 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(24,6)) Reducer 20 Execution mode: vectorized, llap @@ -668,16 +668,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.9815675 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) Reducer 21 @@ -685,7 +685,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -693,14 +693,14 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 26666666 Data size: 5653333192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(24,6)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(24,6)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 5759999856 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)), _col2 (type: boolean) Reducer 23 @@ -743,15 +743,15 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: char(30)), KEY.reducesinkkey3 (type: varchar(20)) + expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: char(30)), KEY.reducesinkkey3 (type: varchar(20)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 6666666 Data size: 2479999752 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6666666 Data size: 957660232 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 37200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 14624 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 37200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 14624 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -761,19 +761,19 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)), KEY._col1 (type: varchar(20)) + keys: KEY._col0 (type: string), KEY._col1 (type: varchar(20)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 24320000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 24318758276 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col2 (type: decimal(24,6)) + expressions: _col0 (type: string), _col2 (type: decimal(24,6)) outputColumnNames: _col0, _col2 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(24,6)) Reducer 4 @@ -783,18 +783,18 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col2, _col4, _col5 input vertices: 1 Reducer 10 Statistics: Num rows: 26666666 Data size: 8746666448 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 8746666448 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(24,6)), _col4 (type: decimal(24,6)), _col5 (type: boolean) Reducer 5 @@ -804,18 +804,18 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col2, _col4, _col5, _col7 input vertices: 1 Reducer 13 Statistics: Num rows: 26666666 Data size: 11733333040 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 26666666 Data size: 11733333040 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(24,6)), _col4 (type: decimal(24,6)), _col5 (type: boolean), _col7 (type: decimal(24,6)) Reducer 6 @@ -825,8 +825,8 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col2, _col4, _col5, _col7, _col9, _col10 input vertices: 1 Reducer 15 @@ -836,10 +836,10 @@ STAGE PLANS: predicate: if(_col5, if(_col10, ((_col7 / _col9) > (_col2 / _col4)), false), false) (type: boolean) Statistics: Num rows: 13333333 Data size: 7413333148 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 13333333 Data size: 7413333148 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col7 (type: decimal(24,6)), _col9 (type: decimal(24,6)), _col10 (type: boolean) Reducer 7 @@ -849,18 +849,18 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col7, _col9, _col10, _col12 input vertices: 1 Reducer 19 Statistics: Num rows: 13333333 Data size: 5866666520 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 13333333 Data size: 5866666520 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col7 (type: decimal(24,6)), _col9 (type: decimal(24,6)), _col10 (type: boolean), _col12 (type: decimal(24,6)) Reducer 8 @@ -870,8 +870,8 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col7, _col9, _col10, _col12, _col14, _col15 input vertices: 1 Reducer 21 @@ -881,14 +881,14 @@ STAGE PLANS: predicate: if(_col15, if(_col10, ((_col7 / _col9) > (_col12 / _col14)), false), false) (type: boolean) Statistics: Num rows: 6666666 Data size: 3706666296 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)) + expressions: _col0 (type: string) outputColumnNames: _col0 Statistics: Num rows: 6666666 Data size: 666666600 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 6666666 Data size: 666666600 Basic stats: COMPLETE Column stats: COMPLETE Reducer 9 Execution mode: vectorized, llap @@ -906,16 +906,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col2) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(24,6)) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query41.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query41.q.out index e7ac140dba20..a201fc6d8d84 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query41.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query41.q.out @@ -18,15 +18,15 @@ STAGE PLANS: TableScan alias: i1 filterExpr: (i_manufact_id BETWEEN 970 AND 1010 and i_manufact is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_43_container, bigKeyColName:i_manufact, smallTablePos:1, keyRatio:0.001751082251082251 - Statistics: Num rows: 462000 Data size: 95167396 Basic stats: COMPLETE Column stats: COMPLETE + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_43_container, bigKeyColName:i_manufact, smallTablePos:1, keyRatio:0.0023073593073593074 + Statistics: Num rows: 462000 Data size: 94935739 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manufact_id BETWEEN 970 AND 1010 and i_manufact is not null) (type: boolean) - Statistics: Num rows: 14511 Data size: 2989126 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14475 Data size: 2974640 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_manufact (type: char(50)), i_product_name (type: char(50)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 14511 Data size: 2931222 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14475 Data size: 2916880 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -36,25 +36,25 @@ STAGE PLANS: outputColumnNames: _col1 input vertices: 1 Reducer 5 - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 110317 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col1 (type: char(50)) null sort order: z - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 110317 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator keys: _col1 (type: char(50)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 106465 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(50)) - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 106465 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 4 @@ -62,27 +62,27 @@ STAGE PLANS: TableScan alias: item filterExpr: ((((i_category = 'Women ') and (i_color) IN ('frosted ', 'rose ') and (i_units) IN ('Gross ', 'Lb ') and (i_size) IN ('large ', 'medium ')) or ((i_category = 'Women ') and (i_color) IN ('black ', 'chocolate ') and (i_units) IN ('Box ', 'Dram ') and (i_size) IN ('economy ', 'petite ')) or ((i_category = 'Men ') and (i_color) IN ('magenta ', 'slate ') and (i_units) IN ('Bundle ', 'Carton ') and (i_size) IN ('N/A ', 'small ')) or ((i_category = 'Men ') and (i_color) IN ('cornflower ', 'firebrick ') and (i_units) IN ('Oz ', 'Pound ') and (i_size) IN ('large ', 'medium ')) or ((i_category = 'Women ') and (i_color) IN ('almond ', 'steel ') and (i_units) IN ('Case ', 'Tsp ') and (i_size) IN ('large ', 'medium ')) or ((i_category = 'Women ') and (i_color) IN ('aquamarine ', 'purple ') and (i_units) IN ('Bunch ', 'Gram ') and (i_size) IN ('economy ', 'petite ')) or ((i_category = 'Men ') and (i_color) IN ('lavender ', 'papaya ') and (i_units) IN ('Cup ', 'Pallet ') and (i_size) IN ('N/A ', 'small ')) or ((i_category = 'Men ') and (i_color) IN ('cyan ', 'maroon ') and (i_units) IN ('Each ', 'N/A ') and (i_size) IN ('large ', 'medium '))) and i_manufact is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 207900000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 207380715 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((((i_category = 'Women ') and (i_color) IN ('frosted ', 'rose ') and (i_units) IN ('Gross ', 'Lb ') and (i_size) IN ('large ', 'medium ')) or ((i_category = 'Women ') and (i_color) IN ('black ', 'chocolate ') and (i_units) IN ('Box ', 'Dram ') and (i_size) IN ('economy ', 'petite ')) or ((i_category = 'Men ') and (i_color) IN ('magenta ', 'slate ') and (i_units) IN ('Bundle ', 'Carton ') and (i_size) IN ('N/A ', 'small ')) or ((i_category = 'Men ') and (i_color) IN ('cornflower ', 'firebrick ') and (i_units) IN ('Oz ', 'Pound ') and (i_size) IN ('large ', 'medium ')) or ((i_category = 'Women ') and (i_color) IN ('almond ', 'steel ') and (i_units) IN ('Case ', 'Tsp ') and (i_size) IN ('large ', 'medium ')) or ((i_category = 'Women ') and (i_color) IN ('aquamarine ', 'purple ') and (i_units) IN ('Bunch ', 'Gram ') and (i_size) IN ('economy ', 'petite ')) or ((i_category = 'Men ') and (i_color) IN ('lavender ', 'papaya ') and (i_units) IN ('Cup ', 'Pallet ') and (i_size) IN ('N/A ', 'small ')) or ((i_category = 'Men ') and (i_color) IN ('cyan ', 'maroon ') and (i_units) IN ('Each ', 'N/A ') and (i_size) IN ('large ', 'medium '))) and i_manufact is not null) (type: boolean) - Statistics: Num rows: 168 Data size: 75600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 224 Data size: 100800 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_manufact (type: char(50)) outputColumnNames: i_manufact - Statistics: Num rows: 168 Data size: 75600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 224 Data size: 100800 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: i_manufact (type: char(50)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 168 Data size: 17304 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 224 Data size: 23072 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(50)) - Statistics: Num rows: 168 Data size: 17304 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 224 Data size: 23072 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -93,25 +93,25 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 106465 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)) null sort order: z sort order: + - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 106465 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: char(50)) outputColumnNames: _col0 - Statistics: Num rows: 809 Data size: 86563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1066 Data size: 106465 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 10700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 10058 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 10700 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 10058 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -124,20 +124,20 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 168 Data size: 17304 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 224 Data size: 23072 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col1 > 0L) (type: boolean) - Statistics: Num rows: 56 Data size: 5768 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 74 Data size: 7622 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(50)) outputColumnNames: _col0 - Statistics: Num rows: 56 Data size: 5320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 74 Data size: 7030 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(50)) - Statistics: Num rows: 56 Data size: 5320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 74 Data size: 7030 Basic stats: COMPLETE Column stats: COMPLETE Stage: Stage-0 Fetch Operator diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query42.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query42.q.out index ee12089c0632..dac75e0ad731 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query42.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query42.q.out @@ -41,7 +41,7 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col6 input vertices: 1 Map 5 - Statistics: Num rows: 13467990 Data size: 1265991132 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13467990 Data size: 1265990232 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: int), _col6 (type: char(50)) @@ -100,20 +100,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_manager_id = 1) (type: boolean) - Statistics: Num rows: 462000 Data size: 48962948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 48862868 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manager_id = 1) (type: boolean) - Statistics: Num rows: 4442 Data size: 470772 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 469872 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_category_id (type: int), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4442 Data size: 453044 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 452144 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 453044 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 452144 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -125,29 +125,29 @@ STAGE PLANS: keys: KEY._col0 (type: int), KEY._col1 (type: char(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 110 Data size: 22660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 20600 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: -++ keys: _col2 (type: decimal(17,2)), _col0 (type: int), _col1 (type: char(50)) null sort order: azz - Statistics: Num rows: 110 Data size: 22660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 20600 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col0 (type: int), _col1 (type: char(50)), _col2 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 110 Data size: 22660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 20600 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: decimal(17,2)), _col0 (type: int), _col1 (type: char(50)) null sort order: azz sort order: -++ - Statistics: Num rows: 110 Data size: 22660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 20600 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey1 (type: int), KEY.reducesinkkey2 (type: char(50)), KEY.reducesinkkey0 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 110 Data size: 22660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 20600 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 20600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query43.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query43.q.out index 83c84054d0ea..7bf51c4cd3b8 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query43.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query43.q.out @@ -45,17 +45,17 @@ STAGE PLANS: outputColumnNames: _col1, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col12, _col13 input vertices: 1 Map 5 - Statistics: Num rows: 3244319959 Data size: 851663160776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3244319959 Data size: 851663160688 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col13 (type: varchar(50)), _col12 (type: string) null sort order: zz - Statistics: Num rows: 3244319959 Data size: 851663160776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3244319959 Data size: 851663160688 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col13 (type: varchar(50)), _col12 (type: string), if(_col4, _col1, null) (type: decimal(7,2)), if(_col5, _col1, null) (type: decimal(7,2)), if(_col6, _col1, null) (type: decimal(7,2)), if(_col7, _col1, null) (type: decimal(7,2)), if(_col8, _col1, null) (type: decimal(7,2)), if(_col9, _col1, null) (type: decimal(7,2)), if(_col10, _col1, null) (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 3244319959 Data size: 851663160776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3244319959 Data size: 851663160688 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2), sum(_col3), sum(_col4), sum(_col5), sum(_col6), sum(_col7), sum(_col8) keys: _col0 (type: varchar(50)), _col1 (type: string) @@ -115,20 +115,20 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_gmt_offset = -6) (type: boolean) - Statistics: Num rows: 1704 Data size: 523936 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 523056 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_gmt_offset = -6) (type: boolean) - Statistics: Num rows: 341 Data size: 104916 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 341 Data size: 104828 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_id (type: string), s_store_name (type: varchar(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 341 Data size: 66836 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 341 Data size: 66748 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 341 Data size: 66836 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 341 Data size: 66748 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -140,25 +140,25 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(50)), KEY._col1 (type: string) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 3751 Data size: 3645972 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3410 Data size: 3314520 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++++++ keys: _col0 (type: varchar(50)), _col1 (type: string), _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)), _col8 (type: decimal(17,2)) null sort order: zzzzzzzzz - Statistics: Num rows: 3751 Data size: 3645972 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3410 Data size: 3314520 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Reduce Output Operator key expressions: _col0 (type: varchar(50)), _col1 (type: string), _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)), _col8 (type: decimal(17,2)) null sort order: zzzzzzzzz sort order: +++++++++ - Statistics: Num rows: 3751 Data size: 3645972 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3410 Data size: 3314520 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: varchar(50)), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: decimal(17,2)), KEY.reducesinkkey3 (type: decimal(17,2)), KEY.reducesinkkey4 (type: decimal(17,2)), KEY.reducesinkkey5 (type: decimal(17,2)), KEY.reducesinkkey6 (type: decimal(17,2)), KEY.reducesinkkey7 (type: decimal(17,2)), KEY.reducesinkkey8 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 3751 Data size: 3645972 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3410 Data size: 3314520 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 97200 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query44.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query44.q.out index b152d4d94b9b..25dbdd49c189 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query44.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query44.q.out @@ -70,24 +70,24 @@ STAGE PLANS: Map Operator Tree: TableScan alias: i1 - Statistics: Num rows: 462000 Data size: 53130000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53008448 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_product_name (type: char(50)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 462000 Data size: 53130000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53008448 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 53130000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53008448 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 53130000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53008448 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -200,7 +200,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col5 input vertices: 1 Reducer 8 - Statistics: Num rows: 51333 Data size: 6108627 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51333 Data size: 5987075 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -210,22 +210,22 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col7 input vertices: 1 Map 7 - Statistics: Num rows: 51333 Data size: 11190594 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51333 Data size: 10947490 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col1 (type: int) null sort order: z - Statistics: Num rows: 51333 Data size: 11190594 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51333 Data size: 10947490 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col1 (type: int), _col5 (type: char(50)), _col7 (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 51333 Data size: 11190594 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51333 Data size: 10704172 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int) null sort order: z sort order: + - Statistics: Num rows: 51333 Data size: 11190594 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51333 Data size: 10704172 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)) Reducer 4 Execution mode: vectorized, llap @@ -233,13 +233,13 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: int), VALUE._col0 (type: char(50)), VALUE._col1 (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 51333 Data size: 11190594 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 51333 Data size: 10704172 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 21800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 21158 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 21800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 21158 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -322,7 +322,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 53130000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53008448 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Stage: Stage-0 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query45.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query45.q.out index 90e29e7317d7..386c974b0aa7 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query45.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query45.q.out @@ -69,17 +69,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer_address - Statistics: Num rows: 40000000 Data size: 7800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7575751001 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_county (type: varchar(30)), ca_zip (type: char(10)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40000000 Data size: 7800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7575751001 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 7800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7575751001 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)), _col2 (type: char(10)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -211,14 +211,14 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4 input vertices: 1 Map 3 - Statistics: Num rows: 80000000 Data size: 15600000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15375751001 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15600000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15375751001 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: varchar(30)), _col4 (type: char(10)) Reducer 5 Execution mode: vectorized, llap @@ -232,7 +232,7 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col7 input vertices: 0 Reducer 2 - Statistics: Num rows: 1087859571 Data size: 333670462313 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 333446213314 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: @@ -243,37 +243,37 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col7, _col15 input vertices: 1 Map 9 - Statistics: Num rows: 1087859571 Data size: 329317176033 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 329092927034 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col7 (type: decimal(7,2)), _col3 (type: varchar(30)), _col4 (type: char(10)), _col15 (type: boolean) outputColumnNames: _col2, _col7, _col8, _col15 - Statistics: Num rows: 1087859571 Data size: 329317176033 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 329092927034 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col15 is not null or (substr(_col8, 1, 5)) IN ('85669', '86197', '88274', '83405', '86475', '85392', '85460', '80348', '81792')) (type: boolean) - Statistics: Num rows: 1087859571 Data size: 329317176033 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 329092927034 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col8 (type: char(10)), _col7 (type: varchar(30)) null sort order: zz - Statistics: Num rows: 1087859571 Data size: 329317176033 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 329092927034 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: decimal(7,2)), _col7 (type: varchar(30)), _col8 (type: char(10)) outputColumnNames: _col2, _col7, _col8 - Statistics: Num rows: 1087859571 Data size: 329317176033 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 329092927034 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col8 (type: char(10)), _col7 (type: varchar(30)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1087859571 Data size: 325270011729 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 324821513544 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(10)), _col1 (type: varchar(30)) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: char(10)), _col1 (type: varchar(30)) - Statistics: Num rows: 1087859571 Data size: 325270011729 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1087859571 Data size: 324821513544 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -283,12 +283,12 @@ STAGE PLANS: keys: KEY._col0 (type: char(10)), KEY._col1 (type: varchar(30)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 18408340 Data size: 5504093660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18400731 Data size: 5494232579 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(10)), _col1 (type: varchar(30)) null sort order: zz sort order: ++ - Statistics: Num rows: 18408340 Data size: 5504093660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18400731 Data size: 5494232579 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -296,7 +296,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(10)), KEY.reducesinkkey1 (type: varchar(30)), VALUE._col0 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 18408340 Data size: 5504093660 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18400731 Data size: 5494232579 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 29900 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query46.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query46.q.out index 395e6bb7c52f..fd589574be51 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query46.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query46.q.out @@ -20,20 +20,20 @@ STAGE PLANS: TableScan alias: customer filterExpr: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_current_addr_sk (type: bigint), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: char(20)), _col3 (type: char(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -42,7 +42,7 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_city) IN ('Cedar Grove', 'Highland Park', 'Salem', 'Union', 'Wildwood') (type: boolean) - Statistics: Num rows: 1704 Data size: 172104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 171081 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_city) IN ('Cedar Grove', 'Highland Park', 'Salem', 'Union', 'Wildwood') (type: boolean) Statistics: Num rows: 32 Data size: 3232 Basic stats: COMPLETE Column stats: COMPLETE @@ -83,24 +83,24 @@ STAGE PLANS: Map Operator Tree: TableScan alias: current_addr - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_city (type: varchar(60)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(60)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(60)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -206,14 +206,14 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col5 input vertices: 1 Map 3 - Statistics: Num rows: 80000000 Data size: 22480000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 21864689839 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 22480000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 21864689839 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: char(20)), _col3 (type: char(30)), _col5 (type: varchar(60)) Reducer 5 Execution mode: vectorized, llap @@ -227,7 +227,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col4, _col5, _col6, _col12 input vertices: 1 Map 3 - Statistics: Num rows: 64869023 Data size: 6551771563 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 6440192302 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col5), sum(_col6) @@ -235,13 +235,13 @@ STAGE PLANS: minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 64869023 Data size: 21082432491 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 20970853230 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: varchar(60)), _col2 (type: bigint), _col3 (type: bigint) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: varchar(60)), _col2 (type: bigint), _col3 (type: bigint) - Statistics: Num rows: 64869023 Data size: 21082432491 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 20970853230 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -251,17 +251,17 @@ STAGE PLANS: keys: KEY._col0 (type: bigint), KEY._col1 (type: varchar(60)), KEY._col2 (type: bigint), KEY._col3 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 64869023 Data size: 21082432491 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 20970853230 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: bigint), _col0 (type: bigint), _col1 (type: varchar(60)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 64869023 Data size: 21082432483 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 20970853222 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 64869023 Data size: 21082432483 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 20970853222 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: varchar(60)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -275,26 +275,26 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col5, _col6, _col8, _col9, _col10 input vertices: 0 Reducer 2 - Statistics: Num rows: 64869023 Data size: 38791675754 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 38064786332 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Filter Operator predicate: (_col5 <> _col8) (type: boolean) - Statistics: Num rows: 64869023 Data size: 38791675754 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 38064786332 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++ keys: _col3 (type: char(30)), _col2 (type: char(20)), _col5 (type: varchar(60)), _col8 (type: varchar(60)), _col6 (type: bigint) null sort order: zzzzz - Statistics: Num rows: 64869023 Data size: 38791675754 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 38064786332 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: char(30)), _col2 (type: char(20)), _col5 (type: varchar(60)), _col8 (type: varchar(60)), _col6 (type: bigint), _col9 (type: decimal(17,2)), _col10 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 64869023 Data size: 38791675754 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 37337896544 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: bigint) null sort order: zzzzz sort order: +++++ - Statistics: Num rows: 64869023 Data size: 38791675754 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 37337896544 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) Reducer 8 Execution mode: vectorized, llap @@ -302,13 +302,13 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(30)), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: varchar(60)), KEY.reducesinkkey3 (type: varchar(60)), KEY.reducesinkkey4 (type: bigint), VALUE._col0 (type: decimal(17,2)), VALUE._col1 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 64869023 Data size: 38791675754 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 64869023 Data size: 37337896544 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 59800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 57802 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 59800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 57802 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query47.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query47.q.out index bbe8be4bbd66..14b3bdc07179 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query47.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query47.q.out @@ -48,7 +48,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col5, _col6, _col8, _col9 input vertices: 1 Map 9 - Statistics: Num rows: 18884534606 Data size: 5585078338266 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18651541762 Data size: 5513549533277 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -58,20 +58,20 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col6, _col8, _col9, _col11, _col12 input vertices: 1 Map 10 - Statistics: Num rows: 18884534606 Data size: 9022063636558 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 18560140713 Data size: 8863434806670 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col5 (type: int), _col6 (type: int), _col8 (type: varchar(50)), _col9 (type: varchar(50)), _col11 (type: char(50)), _col12 (type: char(50)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 9442267303 Data size: 4617268711167 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9280070356 Data size: 4537954296207 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col4 (type: char(50)), _col5 (type: char(50)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col4 (type: char(50)), _col5 (type: char(50)) - Statistics: Num rows: 9442267303 Data size: 4617268711167 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9280070356 Data size: 4537954296207 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col6 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -79,21 +79,21 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - filterExpr: (i_category is not null and i_brand is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + filterExpr: (i_brand is not null and i_category is not null) (type: boolean) + Statistics: Num rows: 462000 Data size: 91260620 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (i_category is not null and i_brand is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (i_brand is not null and i_category is not null) (type: boolean) + Statistics: Num rows: 459736 Data size: 90813398 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 459736 Data size: 90813398 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 459736 Data size: 90813398 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -139,21 +139,21 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - filterExpr: (s_store_name is not null and s_company_name is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + filterExpr: (s_company_name is not null and s_store_name is not null) (type: boolean) + Statistics: Num rows: 1704 Data size: 316767 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (s_store_name is not null and s_company_name is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (s_company_name is not null and s_store_name is not null) (type: boolean) + Statistics: Num rows: 1681 Data size: 312466 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), s_company_name (type: varchar(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1681 Data size: 312466 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1681 Data size: 312466 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(50)), _col2 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -165,20 +165,20 @@ STAGE PLANS: keys: KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: varchar(50)), KEY._col3 (type: varchar(50)), KEY._col4 (type: char(50)), KEY._col5 (type: char(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col0 (type: int), _col1 (type: int) null sort order: aaaazz sort order: ++++++ Map-reduce partition columns: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)) - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col6 (type: decimal(17,2)) Reduce Output Operator key expressions: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col0 (type: int) null sort order: aaaaa sort order: +++++ Map-reduce partition columns: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col0 (type: int) - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col6 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -186,7 +186,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey4 (type: int), KEY.reducesinkkey5 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey3 (type: varchar(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col0 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -207,20 +207,20 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: rank_window_0 is not null (type: boolean) - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col6 (type: decimal(17,2)), (rank_window_0 + 1) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 4309536 Data size: 2090124960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2092941840 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col5 (type: int) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col5 (type: int) - Statistics: Num rows: 4309536 Data size: 2090124960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2092941840 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) PTF Operator Function definitions: @@ -242,20 +242,20 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: rank_window_0 is not null (type: boolean) - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col6 (type: decimal(17,2)), (rank_window_0 - 1) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 4309536 Data size: 2090124960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2092941840 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col5 (type: int) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col5 (type: int) - Statistics: Num rows: 4309536 Data size: 2090124960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2092941840 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -268,7 +268,7 @@ STAGE PLANS: null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col5 (type: int) - Statistics: Num rows: 4309536 Data size: 2090124960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2092941840 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) Reducer 5 Execution mode: vectorized, llap @@ -276,7 +276,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey4 (type: int), VALUE._col0 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey3 (type: varchar(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -296,17 +296,17 @@ STAGE PLANS: name: avg window function: GenericUDAFAverageEvaluatorDecimal window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: avg_window_0 (type: decimal(21,6)), _col0 (type: int), _col1 (type: int), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col4 (type: char(50)), _col5 (type: char(50)), _col6 (type: decimal(17,2)) outputColumnNames: avg_window_0, _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)), _col0 (type: int), _col1 (type: int) null sort order: aaaazz sort order: ++++++ Map-reduce partition columns: _col5 (type: char(50)), _col4 (type: char(50)), _col2 (type: varchar(50)), _col3 (type: varchar(50)) - Statistics: Num rows: 4309536 Data size: 2107363104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2110203216 Basic stats: COMPLETE Column stats: COMPLETE value expressions: avg_window_0 (type: decimal(21,6)), _col6 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap @@ -314,7 +314,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: decimal(21,6)), KEY.reducesinkkey4 (type: int), KEY.reducesinkkey5 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey3 (type: varchar(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 4309536 Data size: 2590031136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2593521744 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -335,21 +335,21 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 4309536 Data size: 2590031136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4315344 Data size: 2593521744 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col0 > 0) and rank_window_1 is not null and (_col1 = 2000)) (type: boolean) - Statistics: Num rows: 718256 Data size: 431671856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 719224 Data size: 432253624 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: rank_window_1 (type: int), _col0 (type: decimal(21,6)), _col1 (type: int), _col2 (type: int), _col3 (type: varchar(50)), _col4 (type: varchar(50)), _col5 (type: char(50)), _col6 (type: char(50)), _col7 (type: decimal(17,2)) outputColumnNames: rank_window_1, _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 718256 Data size: 431671856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 719224 Data size: 432253624 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: if((_col0 > 0), ((abs((_col7 - _col0)) / _col0) > 0.1), false) (type: boolean) - Statistics: Num rows: 359128 Data size: 217272440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 217565260 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col6 (type: char(50)), _col5 (type: char(50)), _col3 (type: varchar(50)), _col4 (type: varchar(50)), _col1 (type: int), _col2 (type: int), _col7 (type: decimal(17,2)), _col0 (type: decimal(21,6)), rank_window_1 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 359128 Data size: 217272440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 217565260 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -359,7 +359,7 @@ STAGE PLANS: outputColumnNames: _col4, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 input vertices: 0 Reducer 4 - Statistics: Num rows: 359128 Data size: 257494776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 257841804 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -369,22 +369,22 @@ STAGE PLANS: outputColumnNames: _col4, _col6, _col10, _col11, _col12, _col13, _col19 input vertices: 1 Reducer 3 - Statistics: Num rows: 359128 Data size: 196083888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 196348152 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: (_col12 - _col13) (type: decimal(22,6)), _col11 (type: int) null sort order: zz - Statistics: Num rows: 359128 Data size: 196083888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 196348152 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col6 (type: char(50)), _col10 (type: int), _col11 (type: int), _col13 (type: decimal(21,6)), _col12 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col19 (type: decimal(17,2)), (_col12 - _col13) (type: decimal(22,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 359128 Data size: 236306224 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 236624696 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col7 (type: decimal(22,6)), _col2 (type: int) null sort order: zz sort order: ++ - Statistics: Num rows: 359128 Data size: 236306224 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 236624696 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col1 (type: int), _col3 (type: decimal(21,6)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -392,7 +392,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), VALUE._col1 (type: int), KEY.reducesinkkey1 (type: int), VALUE._col2 (type: decimal(21,6)), VALUE._col3 (type: decimal(17,2)), VALUE._col4 (type: decimal(17,2)), VALUE._col5 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 359128 Data size: 196083888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 359612 Data size: 196348152 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 54600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query48.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query48.q.out index 59b49bfa8fc1..dd57e3402696 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query48.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query48.q.out @@ -16,7 +16,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: (ss_sales_price BETWEEN 50 AND 200 and ss_net_profit is not null and ss_cdemo_sk is not null and ss_addr_sk is not null and ss_store_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_66_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:3.323733066508898E-4 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_66_container, bigKeyColName:ss_addr_sk, smallTablePos:1, keyRatio:6.775300789584274E-4 Statistics: Num rows: 82510879939 Data size: 20962809999708 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ss_sales_price BETWEEN 50 AND 200 and ss_net_profit is not null and ss_cdemo_sk is not null and ss_addr_sk is not null and ss_store_sk is not null) (type: boolean) @@ -54,14 +54,14 @@ STAGE PLANS: outputColumnNames: _col2, _col4, _col5, _col6, _col10, _col11, _col12 input vertices: 1 Map 5 - Statistics: Num rows: 27424414 Data size: 658185940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 55903603 Data size: 1341686476 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col10 and _col4) or (_col11 and _col5) or (_col12 and _col6)) (type: boolean) - Statistics: Num rows: 20568309 Data size: 493639420 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 41927700 Data size: 1006264804 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: int) outputColumnNames: _col2 - Statistics: Num rows: 20568309 Data size: 493639420 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 41927700 Data size: 1006264804 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) minReductionHashAggr: 0.99 @@ -138,20 +138,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: ((ca_state) IN ('GA', 'IN', 'KY', 'MO', 'MT', 'NM', 'OR', 'WI', 'WV') and (ca_country = 'United States')) (type: boolean) - Statistics: Num rows: 40000000 Data size: 7640000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7420490932 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((ca_state) IN ('GA', 'IN', 'KY', 'MO', 'MT', 'NM', 'OR', 'WI', 'WV') and (ca_country = 'United States')) (type: boolean) - Statistics: Num rows: 3396227 Data size: 648679357 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 1284315894 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), (ca_state) IN ('GA', 'KY', 'NM') (type: boolean), (ca_state) IN ('IN', 'MT', 'OR') (type: boolean), (ca_state) IN ('MO', 'WI', 'WV') (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3396227 Data size: 67924540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 138461540 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 3396227 Data size: 67924540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 138461540 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: boolean), _col2 (type: boolean), _col3 (type: boolean) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query50.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query50.q.out index 0e28ac34c278..3ee7b36c9055 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query50.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query50.q.out @@ -125,17 +125,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 1407456 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 1398604 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), s_company_id (type: int), s_street_number (type: varchar(10)), s_street_name (type: varchar(60)), s_street_type (type: char(15)), s_suite_number (type: char(10)), s_city (type: varchar(60)), s_county (type: varchar(30)), s_state (type: char(2)), s_zip (type: char(10)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 1704 Data size: 1407456 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 1398604 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 1407456 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 1398604 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(50)), _col2 (type: int), _col3 (type: varchar(10)), _col4 (type: varchar(60)), _col5 (type: char(15)), _col6 (type: char(10)), _col7 (type: varchar(60)), _col8 (type: varchar(30)), _col9 (type: char(2)), _col10 (type: char(10)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -175,30 +175,30 @@ STAGE PLANS: outputColumnNames: _col3, _col9, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20 input vertices: 1 Map 8 - Statistics: Num rows: 1384306375 Data size: 1154511516702 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1154511507850 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++++++++++ keys: _col11 (type: varchar(50)), _col12 (type: int), _col13 (type: varchar(10)), _col14 (type: varchar(60)), _col15 (type: char(15)), _col16 (type: char(10)), _col17 (type: varchar(60)), _col18 (type: varchar(30)), _col19 (type: char(2)), _col20 (type: char(10)) null sort order: zzzzzzzzzz - Statistics: Num rows: 1384306375 Data size: 1154511516702 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1154511507850 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col11 (type: varchar(50)), _col12 (type: int), _col13 (type: varchar(10)), _col14 (type: varchar(60)), _col15 (type: char(15)), _col16 (type: char(10)), _col17 (type: varchar(60)), _col18 (type: varchar(30)), _col19 (type: char(2)), _col20 (type: char(10)), if(((_col3 - _col9) <= 30L), 1, 0) (type: int), if((((_col3 - _col9) > 30L) and ((_col3 - _col9) <= 60L)), 1, 0) (type: int), if((((_col3 - _col9) > 60L) and ((_col3 - _col9) <= 90L)), 1, 0) (type: int), if((((_col3 - _col9) > 90L) and ((_col3 - _col9) <= 120L)), 1, 0) (type: int), if(((_col3 - _col9) > 120L), 1, 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 1384306375 Data size: 1154511516702 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1154511507850 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col10), sum(_col11), sum(_col12), sum(_col13), sum(_col14) keys: _col0 (type: varchar(50)), _col1 (type: int), _col2 (type: varchar(10)), _col3 (type: varchar(60)), _col4 (type: char(15)), _col5 (type: char(10)), _col6 (type: varchar(60)), _col7 (type: varchar(30)), _col8 (type: char(2)), _col9 (type: char(10)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 1384306375 Data size: 1187734869650 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1187734851132 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(50)), _col1 (type: int), _col2 (type: varchar(10)), _col3 (type: varchar(60)), _col4 (type: char(15)), _col5 (type: char(10)), _col6 (type: varchar(60)), _col7 (type: varchar(30)), _col8 (type: char(2)), _col9 (type: char(10)) null sort order: zzzzzzzzzz sort order: ++++++++++ Map-reduce partition columns: _col0 (type: varchar(50)), _col1 (type: int), _col2 (type: varchar(10)), _col3 (type: varchar(60)), _col4 (type: char(15)), _col5 (type: char(10)), _col6 (type: varchar(60)), _col7 (type: varchar(30)), _col8 (type: char(2)), _col9 (type: char(10)) - Statistics: Num rows: 1384306375 Data size: 1187734869650 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1187734851132 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col10 (type: bigint), _col11 (type: bigint), _col12 (type: bigint), _col13 (type: bigint), _col14 (type: bigint) Reducer 6 Execution mode: vectorized, llap @@ -208,12 +208,12 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(50)), KEY._col1 (type: int), KEY._col2 (type: varchar(10)), KEY._col3 (type: varchar(60)), KEY._col4 (type: char(15)), KEY._col5 (type: char(10)), KEY._col6 (type: varchar(60)), KEY._col7 (type: varchar(30)), KEY._col8 (type: char(2)), KEY._col9 (type: char(10)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 1384306375 Data size: 1187734869650 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1187734851132 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(50)), _col1 (type: int), _col2 (type: varchar(10)), _col3 (type: varchar(60)), _col4 (type: char(15)), _col5 (type: char(10)), _col6 (type: varchar(60)), _col7 (type: varchar(30)), _col8 (type: char(2)), _col9 (type: char(10)) null sort order: zzzzzzzzzz sort order: ++++++++++ - Statistics: Num rows: 1384306375 Data size: 1187734869650 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1187734851132 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col10 (type: bigint), _col11 (type: bigint), _col12 (type: bigint), _col13 (type: bigint), _col14 (type: bigint) Reducer 7 Execution mode: vectorized, llap @@ -221,7 +221,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: varchar(50)), KEY.reducesinkkey1 (type: int), KEY.reducesinkkey2 (type: varchar(10)), KEY.reducesinkkey3 (type: varchar(60)), KEY.reducesinkkey4 (type: char(15)), KEY.reducesinkkey5 (type: char(10)), KEY.reducesinkkey6 (type: varchar(60)), KEY.reducesinkkey7 (type: varchar(30)), KEY.reducesinkkey8 (type: char(2)), KEY.reducesinkkey9 (type: char(10)), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), VALUE._col2 (type: bigint), VALUE._col3 (type: bigint), VALUE._col4 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 1384306375 Data size: 1187734869650 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1384306375 Data size: 1187734851132 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 85800 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query52.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query52.q.out index 97a380747731..a9f3c67b1819 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query52.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query52.q.out @@ -41,7 +41,7 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col6 input vertices: 1 Map 5 - Statistics: Num rows: 13467990 Data size: 1400671032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13467990 Data size: 1400670032 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: int), _col6 (type: char(50)) @@ -100,20 +100,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_manager_id = 1) (type: boolean) - Statistics: Num rows: 462000 Data size: 53582956 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53467656 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manager_id = 1) (type: boolean) - Statistics: Num rows: 4442 Data size: 515192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 514192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand_id (type: int), i_brand (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query53.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query53.q.out index 2bb9dacf8fba..405ed73f9184 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query53.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query53.q.out @@ -66,10 +66,10 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - filterExpr: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'reference ', 'self-help ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'reference ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) - Statistics: Num rows: 462000 Data size: 135823396 Basic stats: COMPLETE Column stats: COMPLETE + filterExpr: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'reference ', 'self-help ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'reference ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) + Statistics: Num rows: 462000 Data size: 135501756 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'reference ', 'self-help ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'reference ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) + predicate: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'reference ', 'self-help ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'reference ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) Statistics: Num rows: 48 Data size: 14112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_manufact_id (type: int) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query54.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query54.q.out index bc282c8d9b5c..cf151ee20d6a 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query54.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query54.q.out @@ -1,7 +1,7 @@ -Warning: Map Join MAPJOIN[294][bigTable=?] in task 'Map 21' is a cross product -Warning: Map Join MAPJOIN[291][bigTable=?] in task 'Map 21' is a cross product -Warning: Map Join MAPJOIN[292][bigTable=?] in task 'Map 1' is a cross product -Warning: Map Join MAPJOIN[286][bigTable=?] in task 'Map 1' is a cross product +Warning: Map Join MAPJOIN[289][bigTable=?] in task 'Reducer 12' is a cross product +Warning: Map Join MAPJOIN[290][bigTable=?] in task 'Map 5' is a cross product +Warning: Map Join MAPJOIN[284][bigTable=?] in task 'Map 5' is a cross product +Warning: Map Join MAPJOIN[283][bigTable=?] in task 'Map 1' is a cross product STAGE DEPENDENCIES: Stage-1 is a root stage Stage-0 depends on stages: Stage-1 @@ -11,23 +11,23 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 21 (BROADCAST_EDGE), Reducer 15 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) - Map 12 <- Map 13 (BROADCAST_EDGE) - Map 14 <- Union 17 (BROADCAST_EDGE) - Map 16 <- Map 19 (BROADCAST_EDGE), Map 5 (BROADCAST_EDGE), Union 17 (CONTAINS) - Map 18 <- Map 19 (BROADCAST_EDGE), Map 5 (BROADCAST_EDGE), Reducer 20 (BROADCAST_EDGE), Union 17 (CONTAINS) - Map 21 <- Reducer 10 (BROADCAST_EDGE), Reducer 11 (BROADCAST_EDGE) - Reducer 10 <- Map 5 (SIMPLE_EDGE) - Reducer 11 <- Map 5 (SIMPLE_EDGE) - Reducer 15 <- Map 12 (CUSTOM_SIMPLE_EDGE), Map 14 (CUSTOM_SIMPLE_EDGE) + Map 1 <- Map 5 (BROADCAST_EDGE), Reducer 10 (BROADCAST_EDGE), Reducer 16 (BROADCAST_EDGE) + Map 13 <- Map 14 (BROADCAST_EDGE) + Map 15 <- Union 18 (BROADCAST_EDGE) + Map 17 <- Map 20 (BROADCAST_EDGE), Map 6 (BROADCAST_EDGE), Union 18 (CONTAINS) + Map 19 <- Map 20 (BROADCAST_EDGE), Map 6 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE), Union 18 (CONTAINS) + Map 5 <- Reducer 12 (BROADCAST_EDGE), Reducer 7 (BROADCAST_EDGE) + Reducer 10 <- Reducer 9 (CUSTOM_SIMPLE_EDGE) + Reducer 11 <- Map 6 (SIMPLE_EDGE) + Reducer 12 <- Reducer 11 (CUSTOM_SIMPLE_EDGE), Reducer 8 (BROADCAST_EDGE) + Reducer 16 <- Map 13 (CUSTOM_SIMPLE_EDGE), Map 15 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (SIMPLE_EDGE) - Reducer 20 <- Map 19 (CUSTOM_SIMPLE_EDGE) + Reducer 21 <- Map 20 (CUSTOM_SIMPLE_EDGE) Reducer 3 <- Reducer 2 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) - Reducer 6 <- Map 5 (SIMPLE_EDGE) - Reducer 7 <- Reducer 6 (CUSTOM_SIMPLE_EDGE) - Reducer 8 <- Map 5 (SIMPLE_EDGE) - Reducer 9 <- Reducer 8 (CUSTOM_SIMPLE_EDGE) + Reducer 7 <- Map 6 (SIMPLE_EDGE) + Reducer 8 <- Map 6 (SIMPLE_EDGE) + Reducer 9 <- Map 6 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 @@ -51,67 +51,57 @@ STAGE PLANS: 1 outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Reducer 9 + 1 Reducer 10 Statistics: Num rows: 80566020964 Data size: 10084401010960 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 - 1 - outputColumnNames: _col0, _col1, _col2 + 0 _col2 (type: bigint) + 1 _col0 (type: bigint) + outputColumnNames: _col0, _col1 input vertices: - 1 Reducer 7 - Statistics: Num rows: 80566020964 Data size: 10084401010960 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 5 + Statistics: Num rows: 80566020964 Data size: 9439872843248 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: 0 _col0 (type: bigint) 1 _col5 (type: bigint) - outputColumnNames: _col1, _col2, _col10 + outputColumnNames: _col1, _col14 input vertices: - 1 Reducer 15 - Statistics: Num rows: 80566020964 Data size: 10099593145520 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col2 (type: bigint) - 1 _col0 (type: bigint) - outputColumnNames: _col1, _col10 - input vertices: - 1 Map 21 - Statistics: Num rows: 80566020964 Data size: 9455064977808 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - aggregations: sum(_col1) - keys: _col10 (type: bigint) - minReductionHashAggr: 0.99 - mode: hash - outputColumnNames: _col0, _col1 + 1 Reducer 16 + Statistics: Num rows: 80566020964 Data size: 9455064977808 Basic stats: COMPLETE Column stats: COMPLETE + Group By Operator + aggregations: sum(_col1) + keys: _col14 (type: bigint) + minReductionHashAggr: 0.99 + mode: hash + outputColumnNames: _col0, _col1 + Statistics: Num rows: 36934 Data size: 4432080 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 36934 Data size: 4432080 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 36934 Data size: 4432080 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: decimal(17,2)) + value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 12 + Map 13 Map Operator Tree: TableScan alias: customer_address - filterExpr: (ca_county is not null and ca_state is not null) (type: boolean) - Statistics: Num rows: 40000000 Data size: 7680000000 Basic stats: COMPLETE Column stats: COMPLETE + filterExpr: (ca_state is not null and ca_county is not null) (type: boolean) + Statistics: Num rows: 40000000 Data size: 7459398866 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (ca_county is not null and ca_state is not null) (type: boolean) - Statistics: Num rows: 40000000 Data size: 7680000000 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (ca_state is not null and ca_county is not null) (type: boolean) + Statistics: Num rows: 37637995 Data size: 7018920456 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_county (type: varchar(30)), ca_state (type: char(2)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40000000 Data size: 7680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 37637995 Data size: 7018920456 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -120,38 +110,38 @@ STAGE PLANS: 1 _col0 (type: varchar(30)), _col1 (type: char(2)) outputColumnNames: _col0 input vertices: - 1 Map 13 - Statistics: Num rows: 35316062 Data size: 282528496 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 14 + Statistics: Num rows: 32796593 Data size: 262372744 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 35316062 Data size: 282528496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 32796593 Data size: 262372744 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 13 + Map 14 Map Operator Tree: TableScan alias: store - filterExpr: (s_county is not null and s_state is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 313536 Basic stats: COMPLETE Column stats: COMPLETE + filterExpr: (s_state is not null and s_county is not null) (type: boolean) + Statistics: Num rows: 1704 Data size: 311512 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (s_county is not null and s_state is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 313536 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (s_state is not null and s_county is not null) (type: boolean) + Statistics: Num rows: 1680 Data size: 307096 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_county (type: varchar(30)), s_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1704 Data size: 313536 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1680 Data size: 307096 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(30)), _col1 (type: char(2)) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: varchar(30)), _col1 (type: char(2)) - Statistics: Num rows: 1704 Data size: 313536 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1680 Data size: 307096 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 14 + Map 15 Map Operator Tree: TableScan alias: customer @@ -172,23 +162,23 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col0, _col1 input vertices: - 1 Union 17 - Statistics: Num rows: 1216 Data size: 19456 Basic stats: COMPLETE Column stats: COMPLETE + 1 Union 18 + Statistics: Num rows: 1365 Data size: 21840 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 1216 Data size: 19456 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1365 Data size: 21840 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 16 + Map 17 Map Operator Tree: TableScan alias: catalog_sales filterExpr: cs_bill_customer_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_289_container, bigKeyColName:cs_item_sk, smallTablePos:1, keyRatio:2.3199545882327872E-5 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_287_container, bigKeyColName:cs_item_sk, smallTablePos:1, keyRatio:2.6044765968361594E-5 Statistics: Num rows: 43005109025 Data size: 1031276889552 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: cs_bill_customer_sk is not null (type: boolean) @@ -205,7 +195,7 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col1, _col2 input vertices: - 1 Map 5 + 1 Map 6 Statistics: Num rows: 1087114782 Data size: 15684993992 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: @@ -215,34 +205,34 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col1 input vertices: - 1 Map 19 - Statistics: Num rows: 997699 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 20 + Statistics: Num rows: 1120058 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 997699 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1120058 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: bigint) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1216 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1365 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1216 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1365 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 18 + Map 19 Map Operator Tree: TableScan alias: web_sales - filterExpr: (ws_bill_customer_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_60_item_i_item_sk_min) AND DynamicValue(RS_60_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_60_item_i_item_sk_bloom_filter))) (type: boolean) + filterExpr: (ws_bill_customer_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_92_item_i_item_sk_min) AND DynamicValue(RS_92_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_92_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 21594638446 Data size: 518249773640 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (ws_bill_customer_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_60_item_i_item_sk_min) AND DynamicValue(RS_60_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_60_item_i_item_sk_bloom_filter))) (type: boolean) + predicate: (ws_bill_customer_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_92_item_i_item_sk_min) AND DynamicValue(RS_92_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_92_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 21591944812 Data size: 518185129112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ws_sold_date_sk (type: bigint), ws_bill_customer_sk (type: bigint), ws_item_sk (type: bigint) @@ -256,7 +246,7 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col1, _col2 input vertices: - 1 Map 5 + 1 Map 6 Statistics: Num rows: 1087114782 Data size: 15684993992 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: @@ -266,49 +256,49 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col1 input vertices: - 1 Map 19 - Statistics: Num rows: 997699 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 20 + Statistics: Num rows: 1120058 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 997699 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1120058 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: bigint) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0 - Statistics: Num rows: 1216 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1365 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1216 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1365 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 19 + Map 20 Map Operator Tree: TableScan alias: item filterExpr: ((i_class = 'consignment ') and (i_category = 'Jewelry ')) (type: boolean) - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((i_class = 'consignment ') and (i_category = 'Jewelry ')) (type: boolean) - Statistics: Num rows: 424 Data size: 80560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 476 Data size: 90440 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 424 Data size: 3392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 476 Data size: 3808 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 424 Data size: 3392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 476 Data size: 3808 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 424 Data size: 3392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 476 Data size: 3808 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -325,10 +315,10 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 424 Data size: 3392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 476 Data size: 3808 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 21 + Map 5 Map Operator Tree: TableScan alias: date_dim @@ -349,7 +339,7 @@ STAGE PLANS: 1 outputColumnNames: _col0, _col1, _col2 input vertices: - 1 Reducer 10 + 1 Reducer 7 Statistics: Num rows: 2264519 Data size: 36232304 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col2 <= _col1) (type: boolean) @@ -362,7 +352,7 @@ STAGE PLANS: 1 outputColumnNames: _col0, _col1, _col3 input vertices: - 1 Reducer 11 + 1 Reducer 12 Statistics: Num rows: 23400009 Data size: 374400144 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col1 <= _col3) (type: boolean) @@ -395,14 +385,14 @@ STAGE PLANS: Target Vertex: Map 1 Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 5 + Map 6 Map Operator Tree: TableScan alias: date_dim - filterExpr: (((d_year = 1999) and (d_moy = 3)) or ((d_year = 1999) and (d_moy = 3) and d_month_seq is not null)) (type: boolean) + filterExpr: (((d_year = 1999) and (d_moy = 3) and d_month_seq is not null) or ((d_year = 1999) and (d_moy = 3))) (type: boolean) Statistics: Num rows: 73049 Data size: 876588 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: ((d_year = 1999) and (d_moy = 3)) (type: boolean) + predicate: ((d_year = 1999) and (d_moy = 3) and d_month_seq is not null) (type: boolean) Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: (d_month_seq + 1) (type: int) @@ -436,6 +426,41 @@ STAGE PLANS: sort order: + Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: ((d_year = 1999) and (d_moy = 3)) (type: boolean) + Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: (d_month_seq + 3) (type: int) + outputColumnNames: _col0 + Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE + Group By Operator + keys: _col0 (type: int) + minReductionHashAggr: 0.4 + mode: hash + outputColumnNames: _col0 + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: (d_month_seq + 1) (type: int) + outputColumnNames: _col0 + Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE + Group By Operator + keys: _col0 (type: int) + minReductionHashAggr: 0.4 + mode: hash + outputColumnNames: _col0 + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: int) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: int) + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: d_date_sk (type: bigint) outputColumnNames: _col0 @@ -461,7 +486,7 @@ STAGE PLANS: Target Input: catalog_sales Partition key expr: cs_sold_date_sk Statistics: Num rows: 31 Data size: 248 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 16 + Target Vertex: Map 17 Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 @@ -477,63 +502,32 @@ STAGE PLANS: Target Input: web_sales Partition key expr: ws_sold_date_sk Statistics: Num rows: 31 Data size: 248 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 18 + Target Vertex: Map 19 Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 31 Data size: 248 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: ((d_year = 1999) and (d_moy = 3) and d_month_seq is not null) (type: boolean) - Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: (d_month_seq + 1) (type: int) - outputColumnNames: _col0 - Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - keys: _col0 (type: int) - minReductionHashAggr: 0.4 - mode: hash - outputColumnNames: _col0 - Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: int) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: (d_month_seq + 3) (type: int) - outputColumnNames: _col0 - Statistics: Num rows: 31 Data size: 372 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - keys: _col0 (type: int) - minReductionHashAggr: 0.4 - mode: hash - outputColumnNames: _col0 - Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: int) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: int) - Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 10 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - keys: KEY._col0 (type: int) + aggregations: count(VALUE._col0) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: int) + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: sq_count_check(_col0) (type: boolean) + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Reducer 11 Execution mode: vectorized, llap Reduce Operator Tree: @@ -542,12 +536,48 @@ STAGE PLANS: mode: mergepartial outputColumnNames: _col0 Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: + Select Operator Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: int) - Reducer 15 + Group By Operator + aggregations: count() + minReductionHashAggr: 0.96774197 + mode: hash + outputColumnNames: _col0 + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: bigint) + Reducer 12 + Execution mode: vectorized, llap + Reduce Operator Tree: + Group By Operator + aggregations: count(VALUE._col0) + mode: mergepartial + outputColumnNames: _col0 + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: sq_count_check(_col0) (type: boolean) + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 + 1 + outputColumnNames: _col0 + input vertices: + 0 Reducer 8 + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int) + Reducer 16 Execution mode: vectorized, llap Reduce Operator Tree: Map Join Operator @@ -558,15 +588,15 @@ STAGE PLANS: 1 KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col5 input vertices: - 0 Map 12 - Statistics: Num rows: 1216 Data size: 9728 Basic stats: COMPLETE Column stats: COMPLETE + 0 Map 13 + Statistics: Num rows: 1285 Data size: 10280 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col5 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col5 (type: bigint) - Statistics: Num rows: 1216 Data size: 9728 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1285 Data size: 10280 Basic stats: COMPLETE Column stats: COMPLETE Reducer 2 Execution mode: vectorized, llap Reduce Operator Tree: @@ -600,7 +630,7 @@ STAGE PLANS: Map-reduce partition columns: _col0 (type: int) Statistics: Num rows: 1 Data size: 12 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) - Reducer 20 + Reducer 21 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator @@ -655,7 +685,7 @@ STAGE PLANS: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe - Reducer 6 + Reducer 7 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator @@ -663,37 +693,25 @@ STAGE PLANS: mode: mergepartial outputColumnNames: _col0 Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator + Reduce Output Operator + null sort order: + sort order: Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - aggregations: count() - minReductionHashAggr: 0.96774197 - mode: hash - outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint) - Reducer 7 + value expressions: _col0 (type: int) + Reducer 8 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: count(VALUE._col0) + keys: KEY._col0 (type: int) mode: mergepartial outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: sq_count_check(_col0) (type: boolean) - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Reducer 8 + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 31 Data size: 124 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: int) + Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator @@ -714,25 +732,8 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint) - Reducer 9 - Execution mode: vectorized, llap - Reduce Operator Tree: - Group By Operator - aggregations: count(VALUE._col0) - mode: mergepartial - outputColumnNames: _col0 - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: sq_count_check(_col0) (type: boolean) - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE - Union 17 - Vertex: Union 17 + Union 18 + Vertex: Union 18 Stage: Stage-0 Fetch Operator diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query55.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query55.q.out index 67d3d6e2dec5..7f7f9c47eec4 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query55.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query55.q.out @@ -41,7 +41,7 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col6 input vertices: 1 Map 5 - Statistics: Num rows: 13467990 Data size: 1400671032 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13467990 Data size: 1400670032 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: int), _col6 (type: char(50)) @@ -100,20 +100,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_manager_id = 36) (type: boolean) - Statistics: Num rows: 462000 Data size: 53582956 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53467656 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manager_id = 36) (type: boolean) - Statistics: Num rows: 4442 Data size: 515192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 514192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand_id (type: int), i_brand (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query56.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query56.q.out index 120408d701ca..fee2850a558e 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query56.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query56.q.out @@ -73,20 +73,20 @@ STAGE PLANS: outputColumnNames: _col2, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 13435479 Data size: 1343548012 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 13579144 Data size: 1357914512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col10 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 5160 Data size: 1093920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5274 Data size: 1118088 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 5160 Data size: 1093920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5274 Data size: 1118088 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -143,20 +143,20 @@ STAGE PLANS: outputColumnNames: _col2, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 7103466 Data size: 710346712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7179424 Data size: 717942512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col10 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 2580 Data size: 546960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2637 Data size: 559044 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 2580 Data size: 546960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2637 Data size: 559044 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -246,20 +246,20 @@ STAGE PLANS: outputColumnNames: _col2, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 3600837 Data size: 460807764 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3639341 Data size: 468970612 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col10 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 1720 Data size: 364640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1758 Data size: 372696 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 1720 Data size: 364640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1758 Data size: 372696 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -348,38 +348,38 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 87318000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87212268 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_color) IN ('chiffon ', 'lace ', 'orchid ') (type: boolean) - Statistics: Num rows: 14589 Data size: 2757321 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14745 Data size: 2783512 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_id (type: string) outputColumnNames: _col0 - Statistics: Num rows: 14589 Data size: 1458900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14745 Data size: 1474500 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0 - Statistics: Num rows: 14589 Data size: 1458900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14745 Data size: 1474500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 14589 Data size: 1458900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14745 Data size: 1474500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 14589 Data size: 1458900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14745 Data size: 1474500 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 14589 Data size: 1458900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14745 Data size: 1474500 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string) outputColumnNames: _col0, _col1 @@ -428,20 +428,20 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col0 (type: string) minReductionHashAggr: 0.6666666 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)) Reducer 15 Execution mode: vectorized, llap @@ -451,20 +451,20 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col0 (type: string) minReductionHashAggr: 0.6666666 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)) Reducer 2 Execution mode: vectorized, llap @@ -474,20 +474,20 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col0 (type: string) minReductionHashAggr: 0.6666666 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)) Reducer 4 Execution mode: vectorized, llap @@ -497,18 +497,18 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col1 (type: decimal(27,2)) null sort order: z - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Reduce Output Operator key expressions: _col1 (type: decimal(27,2)) null sort order: z sort order: + - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: string) Reducer 5 Execution mode: vectorized, llap @@ -516,7 +516,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: string), KEY.reducesinkkey0 (type: decimal(27,2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 860 Data size: 182320 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 879 Data size: 186348 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 21200 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query57.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query57.q.out index 962def104e16..4c98e032eea8 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query57.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query57.q.out @@ -43,58 +43,58 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: bigint) + 0 _col1 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col1, _col2, _col5, _col6, _col8 + outputColumnNames: _col0, _col2, _col5, _col6, _col8, _col9 input vertices: 1 Map 9 - Statistics: Num rows: 9983632978 Data size: 2244414272948 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9934708630 Data size: 3146492056474 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: bigint) + 0 _col0 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col5, _col6, _col8, _col10, _col11 + outputColumnNames: _col2, _col5, _col6, _col8, _col9, _col11 input vertices: 1 Map 10 - Statistics: Num rows: 9983632978 Data size: 4061435474944 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9934708630 Data size: 4041474126630 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) - keys: _col5 (type: int), _col6 (type: int), _col8 (type: varchar(50)), _col10 (type: char(50)), _col11 (type: char(50)) + keys: _col5 (type: int), _col6 (type: int), _col8 (type: char(50)), _col9 (type: char(50)), _col11 (type: varchar(50)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 4991816489 Data size: 2036661127512 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4967354315 Data size: 2026680453450 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: varchar(50)), _col3 (type: char(50)), _col4 (type: char(50)) + key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: varchar(50)) null sort order: zzzzz sort order: +++++ - Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: varchar(50)), _col3 (type: char(50)), _col4 (type: char(50)) - Statistics: Num rows: 4991816489 Data size: 2036661127512 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: varchar(50)) + Statistics: Num rows: 4967354315 Data size: 2026680453450 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 10 Map Operator Tree: TableScan - alias: item - filterExpr: (i_category is not null and i_brand is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + alias: call_center + filterExpr: cc_name is not null (type: boolean) + Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (i_category is not null and i_brand is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + predicate: cc_name is not null (type: boolean) + Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: i_item_sk (type: bigint), i_brand (type: char(50)), i_category (type: char(50)) - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE + expressions: cc_call_center_sk (type: bigint), cc_name (type: varchar(50)) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 91476000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(50)), _col2 (type: char(50)) + Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 8 @@ -138,23 +138,23 @@ STAGE PLANS: Map 9 Map Operator Tree: TableScan - alias: call_center - filterExpr: cc_name is not null (type: boolean) - Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE + alias: item + filterExpr: (i_brand is not null and i_category is not null) (type: boolean) + Statistics: Num rows: 462000 Data size: 91260620 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: cc_name is not null (type: boolean) - Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (i_brand is not null and i_category is not null) (type: boolean) + Statistics: Num rows: 459736 Data size: 90813398 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: cc_call_center_sk (type: bigint), cc_name (type: varchar(50)) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE + expressions: i_item_sk (type: bigint), i_brand (type: char(50)), i_category (type: char(50)) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 459736 Data size: 90813398 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 60 Data size: 6360 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: varchar(50)) + Statistics: Num rows: 459736 Data size: 90813398 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(50)), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 2 @@ -162,42 +162,42 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: varchar(50)), KEY._col3 (type: char(50)), KEY._col4 (type: char(50)) + keys: KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: char(50)), KEY._col3 (type: char(50)), KEY._col4 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)), _col0 (type: int), _col1 (type: int) + key expressions: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col0 (type: int), _col1 (type: int) null sort order: aaazz sort order: +++++ - Map-reduce partition columns: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)) - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)) + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(17,2)) Reduce Output Operator - key expressions: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)), _col0 (type: int) + key expressions: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col0 (type: int) null sort order: aaaa sort order: ++++ - Map-reduce partition columns: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)), _col0 (type: int) - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col0 (type: int) + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col5 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey3 (type: int), KEY.reducesinkkey4 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col0 (type: decimal(17,2)) + expressions: KEY.reducesinkkey3 (type: int), KEY.reducesinkkey4 (type: int), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey2 (type: varchar(50)), VALUE._col0 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition input alias: ptf_0 - output shape: _col0: int, _col1: int, _col2: varchar(50), _col3: char(50), _col4: char(50), _col5: decimal(17,2) + output shape: _col0: int, _col1: int, _col2: char(50), _col3: char(50), _col4: varchar(50), _col5: decimal(17,2) type: WINDOWING Windowing table definition input alias: ptf_1 name: windowingtablefunction order by: _col0 ASC NULLS LAST, _col1 ASC NULLS LAST - partition by: _col4, _col3, _col2 + partition by: _col3, _col2, _col4 raw input shape: window functions: window function definition @@ -207,32 +207,32 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: rank_window_0 is not null (type: boolean) - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900290 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)), _col5 (type: decimal(17,2)), (rank_window_0 + 1) (type: int) + expressions: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: decimal(17,2)), (rank_window_0 + 1) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 5876640 Data size: 2374162560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2377362050 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: int), _col2 (type: varchar(50)) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: int), _col2 (type: varchar(50)) - Statistics: Num rows: 5876640 Data size: 2374162560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2377362050 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) PTF Operator Function definitions: Input definition input alias: ptf_0 - output shape: _col0: int, _col1: int, _col2: varchar(50), _col3: char(50), _col4: char(50), _col5: decimal(17,2) + output shape: _col0: int, _col1: int, _col2: char(50), _col3: char(50), _col4: varchar(50), _col5: decimal(17,2) type: WINDOWING Windowing table definition input alias: ptf_1 name: windowingtablefunction order by: _col0 ASC NULLS LAST, _col1 ASC NULLS LAST - partition by: _col4, _col3, _col2 + partition by: _col3, _col2, _col4 raw input shape: window functions: window function definition @@ -242,20 +242,20 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: rank_window_0 is not null (type: boolean) - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900290 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)), _col5 (type: decimal(17,2)), (rank_window_0 - 1) (type: int) + expressions: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: decimal(17,2)), (rank_window_0 - 1) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 5876640 Data size: 2374162560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2377362050 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: int), _col2 (type: varchar(50)) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: int), _col2 (type: varchar(50)) - Statistics: Num rows: 5876640 Data size: 2374162560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2377362050 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -268,26 +268,26 @@ STAGE PLANS: null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: int), _col2 (type: varchar(50)) - Statistics: Num rows: 5876640 Data size: 2374162560 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2377362050 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) Reducer 5 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey3 (type: int), VALUE._col0 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: decimal(17,2)) + expressions: KEY.reducesinkkey3 (type: int), VALUE._col0 (type: int), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey2 (type: varchar(50)), VALUE._col1 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition input alias: ptf_0 - output shape: _col0: int, _col1: int, _col2: varchar(50), _col3: char(50), _col4: char(50), _col5: decimal(17,2) + output shape: _col0: int, _col1: int, _col2: char(50), _col3: char(50), _col4: varchar(50), _col5: decimal(17,2) type: WINDOWING Windowing table definition input alias: ptf_1 name: windowingtablefunction - order by: _col4 ASC NULLS FIRST, _col3 ASC NULLS FIRST, _col2 ASC NULLS FIRST, _col0 ASC NULLS FIRST - partition by: _col4, _col3, _col2, _col0 + order by: _col3 ASC NULLS FIRST, _col2 ASC NULLS FIRST, _col4 ASC NULLS FIRST, _col0 ASC NULLS FIRST + partition by: _col3, _col2, _col4, _col0 raw input shape: window functions: window function definition @@ -296,36 +296,36 @@ STAGE PLANS: name: avg window function: GenericUDAFAverageEvaluatorDecimal window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: avg_window_0 (type: decimal(21,6)), _col0 (type: int), _col1 (type: int), _col2 (type: varchar(50)), _col3 (type: char(50)), _col4 (type: char(50)), _col5 (type: decimal(17,2)) + expressions: avg_window_0 (type: decimal(21,6)), _col0 (type: int), _col1 (type: int), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: decimal(17,2)) outputColumnNames: avg_window_0, _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)), _col0 (type: int), _col1 (type: int) + key expressions: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col0 (type: int), _col1 (type: int) null sort order: aaazz sort order: +++++ - Map-reduce partition columns: _col4 (type: char(50)), _col3 (type: char(50)), _col2 (type: varchar(50)) - Statistics: Num rows: 5876640 Data size: 2397669120 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col3 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)) + Statistics: Num rows: 5884560 Data size: 2400900480 Basic stats: COMPLETE Column stats: COMPLETE value expressions: avg_window_0 (type: decimal(21,6)), _col5 (type: decimal(17,2)) Reducer 6 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: VALUE._col0 (type: decimal(21,6)), KEY.reducesinkkey3 (type: int), KEY.reducesinkkey4 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: decimal(17,2)) + expressions: VALUE._col0 (type: decimal(21,6)), KEY.reducesinkkey3 (type: int), KEY.reducesinkkey4 (type: int), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey2 (type: varchar(50)), VALUE._col1 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 5876640 Data size: 3055852800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 3059971010 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition input alias: ptf_0 - output shape: _col0: decimal(21,6), _col1: int, _col2: int, _col3: varchar(50), _col4: char(50), _col5: char(50), _col6: decimal(17,2) + output shape: _col0: decimal(21,6), _col1: int, _col2: int, _col3: char(50), _col4: char(50), _col5: varchar(50), _col6: decimal(17,2) type: WINDOWING Windowing table definition input alias: ptf_1 name: windowingtablefunction order by: _col1 ASC NULLS LAST, _col2 ASC NULLS LAST - partition by: _col5, _col4, _col3 + partition by: _col4, _col3, _col5 raw input shape: window functions: window function definition @@ -335,21 +335,21 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 5876640 Data size: 3055852800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5884560 Data size: 3059971010 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col0 > 0) and rank_window_1 is not null and (_col1 = 2000)) (type: boolean) - Statistics: Num rows: 979440 Data size: 509308800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 980760 Data size: 509995200 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: rank_window_1 (type: int), _col0 (type: decimal(21,6)), _col1 (type: int), _col2 (type: int), _col3 (type: varchar(50)), _col4 (type: char(50)), _col5 (type: char(50)), _col6 (type: decimal(17,2)) + expressions: rank_window_1 (type: int), _col0 (type: decimal(21,6)), _col1 (type: int), _col2 (type: int), _col3 (type: char(50)), _col4 (type: char(50)), _col5 (type: varchar(50)), _col6 (type: decimal(17,2)) outputColumnNames: rank_window_1, _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 979440 Data size: 509308800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 980760 Data size: 509995200 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: if((_col0 > 0), ((abs((_col6 - _col0)) / _col0) > 0.1), false) (type: boolean) - Statistics: Num rows: 489720 Data size: 256613280 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 256959120 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col5 (type: char(50)), _col4 (type: char(50)), _col3 (type: varchar(50)), _col1 (type: int), _col2 (type: int), _col6 (type: decimal(17,2)), _col0 (type: decimal(21,6)), rank_window_1 (type: int) + expressions: _col4 (type: char(50)), _col3 (type: char(50)), _col5 (type: varchar(50)), _col1 (type: int), _col2 (type: int), _col6 (type: decimal(17,2)), _col0 (type: decimal(21,6)), rank_window_1 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 489720 Data size: 256613280 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 256959120 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -359,7 +359,7 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12 input vertices: 0 Reducer 4 - Statistics: Num rows: 489720 Data size: 311461920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 311881680 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -369,22 +369,22 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6, _col8, _col9, _col10, _col11, _col16 input vertices: 1 Reducer 3 - Statistics: Num rows: 489720 Data size: 316359120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 316785480 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: (_col10 - _col11) (type: decimal(22,6)), _col8 (type: int) null sort order: zz - Statistics: Num rows: 489720 Data size: 316359120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 316785480 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col5 (type: char(50)), _col6 (type: char(50)), _col8 (type: int), _col9 (type: int), _col11 (type: decimal(21,6)), _col10 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col16 (type: decimal(17,2)), (_col10 - _col11) (type: decimal(22,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 489720 Data size: 371207760 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 371707850 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col8 (type: decimal(22,6)), _col2 (type: int) null sort order: zz sort order: ++ - Statistics: Num rows: 489720 Data size: 371207760 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 371707850 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col3 (type: int), _col4 (type: decimal(21,6)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -392,7 +392,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), VALUE._col1 (type: char(50)), KEY.reducesinkkey1 (type: int), VALUE._col2 (type: int), VALUE._col3 (type: decimal(21,6)), VALUE._col4 (type: decimal(17,2)), VALUE._col5 (type: decimal(17,2)), VALUE._col6 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 489720 Data size: 316359120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 490380 Data size: 316785290 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 64600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query59.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query59.q.out index 6d0eda9d0ba3..41963f391966 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query59.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query59.q.out @@ -24,11 +24,11 @@ STAGE PLANS: TableScan alias: store probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_162_container, bigKeyColName:s_store_id, smallTablePos:1, keyRatio:0.5158450704225352 - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_id (type: string), s_store_name (type: varchar(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 333984 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 333104 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -38,13 +38,13 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3 input vertices: 1 Map 2 - Statistics: Num rows: 3303 Data size: 673812 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3303 Data size: 672932 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 3303 Data size: 673812 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3303 Data size: 672932 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(50)), _col3 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -378,7 +378,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col5, _col7, _col8, _col9, _col10, _col11, _col12, _col13 input vertices: 0 Map 1 - Statistics: Num rows: 312689 Data size: 307685976 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 312689 Data size: 307685096 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -388,22 +388,22 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col5, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col17, _col18, _col19, _col20, _col21, _col22 input vertices: 1 Reducer 6 - Statistics: Num rows: 57379349 Data size: 94561167152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57379349 Data size: 94561166272 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++ keys: _col2 (type: varchar(50)), _col1 (type: string), _col5 (type: int) null sort order: zzz - Statistics: Num rows: 57379349 Data size: 94561167152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57379349 Data size: 94561166272 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: varchar(50)), _col1 (type: string), _col5 (type: int), (_col7 / _col17) (type: decimal(37,20)), (_col8 / _col18) (type: decimal(37,20)), (_col9 / _col9) (type: decimal(37,20)), (_col10 / _col19) (type: decimal(37,20)), (_col11 / _col20) (type: decimal(37,20)), (_col12 / _col21) (type: decimal(37,20)), (_col13 / _col22) (type: decimal(37,20)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 57379349 Data size: 56002244624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57379349 Data size: 56002242776 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(50)), _col1 (type: string), _col2 (type: int) null sort order: zzz sort order: +++ - Statistics: Num rows: 57379349 Data size: 56002244624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57379349 Data size: 56002242776 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(37,20)), _col4 (type: decimal(37,20)), _col5 (type: decimal(37,20)), _col6 (type: decimal(37,20)), _col7 (type: decimal(37,20)), _col8 (type: decimal(37,20)), _col9 (type: decimal(37,20)) Reducer 8 Execution mode: vectorized, llap @@ -411,7 +411,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: varchar(50)), KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: int), VALUE._col0 (type: decimal(37,20)), VALUE._col1 (type: decimal(37,20)), VALUE._col2 (type: decimal(37,20)), VALUE._col3 (type: decimal(37,20)), VALUE._col4 (type: decimal(37,20)), VALUE._col5 (type: decimal(37,20)), VALUE._col6 (type: decimal(37,20)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 57379349 Data size: 56002244624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57379349 Data size: 56002242776 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 97600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query6.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query6.q.out index 3aaa8ab05d5d..dc398ab1e881 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query6.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query6.q.out @@ -60,10 +60,10 @@ STAGE PLANS: TableScan alias: j filterExpr: i_category is not null (type: boolean) - Statistics: Num rows: 462000 Data size: 93193408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 93093328 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: i_category is not null (type: boolean) - Statistics: Num rows: 462000 Data size: 93193408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 460887 Data size: 92869108 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(i_current_price), count(i_current_price) keys: i_category (type: char(50)) @@ -85,7 +85,7 @@ STAGE PLANS: TableScan alias: s filterExpr: ss_customer_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_171_container, bigKeyColName:ss_item_sk, smallTablePos:0, keyRatio:7.749438625217859E-6 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_171_container, bigKeyColName:ss_item_sk, smallTablePos:0, keyRatio:7.044949713658877E-6 Statistics: Num rows: 82510879939 Data size: 1964702246744 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_customer_sk is not null (type: boolean) @@ -103,17 +103,17 @@ STAGE PLANS: outputColumnNames: _col6, _col7 input vertices: 0 Map 9 - Statistics: Num rows: 639413 Data size: 5115312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 581285 Data size: 4650288 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col6 (type: bigint), _col7 (type: bigint) outputColumnNames: _col1, _col2 - Statistics: Num rows: 639413 Data size: 5115312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 581285 Data size: 4650288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 639413 Data size: 5115312 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 581285 Data size: 4650288 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -215,17 +215,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: a - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -234,15 +234,15 @@ STAGE PLANS: TableScan alias: i filterExpr: (i_current_price is not null and i_category is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_170_container, bigKeyColName:i_category, smallTablePos:1, keyRatio:0.997474025974026 - Statistics: Num rows: 462000 Data size: 96889408 Basic stats: COMPLETE Column stats: COMPLETE + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_170_container, bigKeyColName:i_category, smallTablePos:1, keyRatio:0.9950714285714286 + Statistics: Num rows: 462000 Data size: 96789328 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_current_price is not null and i_category is not null) (type: boolean) - Statistics: Num rows: 460833 Data size: 96644674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 459723 Data size: 96312280 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_current_price (type: decimal(7,2)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 460833 Data size: 96644674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 459723 Data size: 96312280 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -252,16 +252,16 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col4 input vertices: 1 Reducer 11 - Statistics: Num rows: 460833 Data size: 106783000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 459723 Data size: 106525816 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col1 > _col4) (type: boolean) - Statistics: Num rows: 153611 Data size: 35594408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 153241 Data size: 35508680 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 153611 Data size: 35594408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 153241 Data size: 35508680 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 11 @@ -272,20 +272,20 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 11 Data size: 2310 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10 Data size: 2100 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: CAST( CAST( (_col1 / _col2) AS decimal(11,6)) AS decimal(16,6)) is not null (type: boolean) - Statistics: Num rows: 11 Data size: 2310 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10 Data size: 2100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(50)), (1.2 * CAST( CAST( (_col1 / _col2) AS decimal(11,6)) AS decimal(16,6))) (type: decimal(14,7)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 11 Data size: 2222 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10 Data size: 2020 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(50)) - Statistics: Num rows: 11 Data size: 2222 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 10 Data size: 2020 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(14,7)) Reducer 13 Execution mode: vectorized, llap @@ -299,7 +299,7 @@ STAGE PLANS: outputColumnNames: _col4, _col7 input vertices: 0 Reducer 2 - Statistics: Num rows: 639413 Data size: 60104822 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 581285 Data size: 4650366 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: @@ -310,20 +310,20 @@ STAGE PLANS: outputColumnNames: _col4 input vertices: 1 Map 16 - Statistics: Num rows: 639413 Data size: 54989518 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 581285 Data size: 86 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col4 (type: char(2)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2 Data size: 102 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(2)) - Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2 Data size: 102 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 14 Execution mode: vectorized, llap @@ -333,7 +333,7 @@ STAGE PLANS: keys: KEY._col0 (type: char(2)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2 Data size: 102 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col1 >= 10L) (type: boolean) Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE @@ -355,13 +355,13 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(2)), KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 1 Data size: 94 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -378,14 +378,14 @@ STAGE PLANS: outputColumnNames: _col0, _col4 input vertices: 1 Map 8 - Statistics: Num rows: 80000000 Data size: 7520000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 7416820898 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 7520000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 7416820898 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: char(2)) Reducer 4 Execution mode: vectorized, llap diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query60.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query60.q.out index b0e5ba681a36..4d7ef498df6e 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query60.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query60.q.out @@ -73,20 +73,20 @@ STAGE PLANS: outputColumnNames: _col2, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 38679150 Data size: 3867915112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 42547065 Data size: 4254706612 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col10 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 114032 Data size: 24174784 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 146608 Data size: 31080896 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 114032 Data size: 24174784 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 146608 Data size: 31080896 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -143,20 +143,20 @@ STAGE PLANS: outputColumnNames: _col2, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 20450037 Data size: 2045003812 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 22495041 Data size: 2249504212 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col10 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 57016 Data size: 12087392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 77616 Data size: 16454592 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 57016 Data size: 12087392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 77616 Data size: 16454592 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -246,20 +246,20 @@ STAGE PLANS: outputColumnNames: _col2, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 10366384 Data size: 1895103728 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 11403022 Data size: 2114870984 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col10 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 57016 Data size: 12087392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 77616 Data size: 16454592 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 57016 Data size: 12087392 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 77616 Data size: 16454592 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -348,38 +348,38 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87679920 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_category = 'Children ') (type: boolean) - Statistics: Num rows: 42000 Data size: 7980000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 8768100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_id (type: string) outputColumnNames: _col0 - Statistics: Num rows: 42000 Data size: 4200000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 4620000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: string) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0 - Statistics: Num rows: 42000 Data size: 4200000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 4620000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 42000 Data size: 4200000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 4620000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 42000 Data size: 4200000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 4620000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 42000 Data size: 4200000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 4620000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string) outputColumnNames: _col0, _col1 @@ -428,12 +428,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col0 (type: string) null sort order: z - Statistics: Num rows: 21381 Data size: 4532772 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 25872 Data size: 5484864 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: sum(_col1) @@ -441,13 +441,13 @@ STAGE PLANS: minReductionHashAggr: 0.6666666 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)) Reducer 15 Execution mode: vectorized, llap @@ -457,12 +457,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col0 (type: string) null sort order: z - Statistics: Num rows: 21381 Data size: 4532772 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 25872 Data size: 5484864 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: sum(_col1) @@ -470,13 +470,13 @@ STAGE PLANS: minReductionHashAggr: 0.6666666 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)) Reducer 2 Execution mode: vectorized, llap @@ -486,12 +486,12 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + keys: _col0 (type: string) null sort order: z - Statistics: Num rows: 21381 Data size: 4532772 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 25872 Data size: 5484864 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: sum(_col1) @@ -499,13 +499,13 @@ STAGE PLANS: minReductionHashAggr: 0.6666666 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)) Reducer 4 Execution mode: vectorized, llap @@ -515,25 +515,25 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col0 (type: string), _col1 (type: decimal(27,2)) null sort order: zz - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: decimal(27,2)) null sort order: zz sort order: ++ - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Reducer 5 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: decimal(27,2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 7127 Data size: 1510924 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8624 Data size: 1828288 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 21200 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query61.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query61.q.out index d1a4083c34eb..1584438c3d2e 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query61.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query61.q.out @@ -61,10 +61,10 @@ STAGE PLANS: TableScan alias: promotion filterExpr: ((p_channel_email = 'Y') or (p_channel_tv = 'Y') or (p_channel_dmail = 'Y')) (type: boolean) - Statistics: Num rows: 2300 Data size: 604900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2300 Data size: 598525 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((p_channel_email = 'Y') or (p_channel_tv = 'Y') or (p_channel_dmail = 'Y')) (type: boolean) - Statistics: Num rows: 2300 Data size: 604900 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2300 Data size: 598525 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: p_promo_sk (type: bigint) outputColumnNames: _col0 @@ -82,26 +82,26 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_category = 'Electronics ') (type: boolean) - Statistics: Num rows: 462000 Data size: 45276000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 45175920 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_category = 'Electronics ') (type: boolean) - Statistics: Num rows: 42000 Data size: 4116000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 4517700 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 42000 Data size: 336000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 369600 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 42000 Data size: 336000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 369600 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 42000 Data size: 336000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 369600 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 3 @@ -157,7 +157,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col4 input vertices: 1 Reducer 13 - Statistics: Num rows: 118561176 Data size: 136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 130417292 Data size: 136 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -167,7 +167,7 @@ STAGE PLANS: outputColumnNames: _col1, _col3, _col4 input vertices: 1 Reducer 10 - Statistics: Num rows: 23754047 Data size: 128 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26129451 Data size: 128 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -177,7 +177,7 @@ STAGE PLANS: outputColumnNames: _col1, _col4 input vertices: 1 Map 11 - Statistics: Num rows: 23754047 Data size: 120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26129451 Data size: 120 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -187,7 +187,7 @@ STAGE PLANS: outputColumnNames: _col7 input vertices: 0 Reducer 2 - Statistics: Num rows: 3959008 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4354909 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col7) minReductionHashAggr: 0.99 @@ -225,7 +225,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3 input vertices: 1 Map 12 - Statistics: Num rows: 121414971 Data size: 128 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133556467 Data size: 128 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -235,7 +235,7 @@ STAGE PLANS: outputColumnNames: _col1, _col3 input vertices: 1 Map 9 - Statistics: Num rows: 24325812 Data size: 120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 26758393 Data size: 120 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -245,7 +245,7 @@ STAGE PLANS: outputColumnNames: _col6 input vertices: 0 Map 1 - Statistics: Num rows: 4054303 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4459733 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col6) minReductionHashAggr: 0.99 @@ -352,7 +352,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 42000 Data size: 336000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 46200 Data size: 369600 Basic stats: COMPLETE Column stats: COMPLETE Reducer 2 Execution mode: vectorized, llap Reduce Operator Tree: diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query62.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query62.q.out index d90878edae16..3040eb8ef8f7 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query62.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query62.q.out @@ -65,12 +65,12 @@ STAGE PLANS: outputColumnNames: _col4, _col5, _col6, _col7, _col8, _col11, _col13, _col15 input vertices: 1 Map 7 - Statistics: Num rows: 3982805920 Data size: 1198824581920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3982805920 Data size: 1198824581830 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++ keys: _col13 (type: string), _col11 (type: char(30)), _col15 (type: varchar(50)) null sort order: zzz - Statistics: Num rows: 3982805920 Data size: 1198824581920 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3982805920 Data size: 1198824581830 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: sum(_col4), sum(_col5), sum(_col6), sum(_col7), sum(_col8) @@ -149,17 +149,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: web_site - Statistics: Num rows: 84 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 84 Data size: 8142 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: web_site_sk (type: bigint), web_name (type: varchar(50)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 84 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 84 Data size: 8142 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 84 Data size: 8232 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 84 Data size: 8142 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -171,16 +171,16 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: char(30)), KEY._col2 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 2430 Data size: 780030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2184 Data size: 701064 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(30)), _col2 (type: varchar(50)), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: bigint), _col0 (type: string) outputColumnNames: _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 2430 Data size: 780030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2184 Data size: 701064 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col8 (type: string), _col1 (type: char(30)), _col2 (type: varchar(50)) null sort order: zzz sort order: +++ - Statistics: Num rows: 2430 Data size: 780030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2184 Data size: 701064 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -188,7 +188,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(30)), KEY.reducesinkkey2 (type: varchar(50)), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), VALUE._col2 (type: bigint), VALUE._col3 (type: bigint), VALUE._col4 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 2430 Data size: 780030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2184 Data size: 701064 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 32100 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query63.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query63.q.out index 5cb0c9859d91..d00f47e643bf 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query63.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query63.q.out @@ -66,10 +66,10 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - filterExpr: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'refernece ', 'self-help ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'refernece ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) - Statistics: Num rows: 462000 Data size: 135823508 Basic stats: COMPLETE Column stats: COMPLETE + filterExpr: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'refernece ', 'self-help ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'refernece ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) + Statistics: Num rows: 462000 Data size: 135501868 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'refernece ', 'self-help ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'refernece ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) + predicate: ((i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ', 'personal ', 'portable ', 'refernece ', 'self-help ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'exportiunivamalg #9 ', 'importoamalg #1 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ') and (i_category) IN ('Books ', 'Children ', 'Electronics ', 'Men ', 'Music ', 'Women ') and (((i_category) IN ('Books ', 'Children ', 'Electronics ') and (i_class) IN ('personal ', 'portable ', 'refernece ', 'self-help ') and (i_brand) IN ('exportiunivamalg #9 ', 'scholaramalgamalg #14 ', 'scholaramalgamalg #7 ', 'scholaramalgamalg #9 ')) or ((i_category) IN ('Men ', 'Music ', 'Women ') and (i_class) IN ('accessories ', 'classical ', 'fragrances ', 'pants ') and (i_brand) IN ('amalgimporto #1 ', 'edu packscholar #1 ', 'exportiimporto #1 ', 'importoamalg #1 ')))) (type: boolean) Statistics: Num rows: 48 Data size: 14112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_manager_id (type: int) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query64.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query64.q.out index d38476f52ca9..6836aad971b5 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query64.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query64.q.out @@ -7,45 +7,47 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Map 19 (BROADCAST_EDGE), Map 31 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) - Map 13 <- Reducer 32 (BROADCAST_EDGE), Reducer 33 (BROADCAST_EDGE) - Map 25 <- Map 19 (BROADCAST_EDGE), Map 31 (BROADCAST_EDGE), Reducer 12 (BROADCAST_EDGE), Reducer 5 (BROADCAST_EDGE) - Map 35 <- Reducer 12 (BROADCAST_EDGE), Reducer 32 (BROADCAST_EDGE), Reducer 33 (BROADCAST_EDGE), Reducer 9 (BROADCAST_EDGE) - Map 6 <- Reducer 32 (BROADCAST_EDGE), Reducer 33 (BROADCAST_EDGE) - Reducer 10 <- Map 13 (CUSTOM_SIMPLE_EDGE), Map 6 (CUSTOM_SIMPLE_EDGE) - Reducer 11 <- Reducer 10 (SIMPLE_EDGE) - Reducer 12 <- Reducer 11 (CUSTOM_SIMPLE_EDGE) + Map 1 <- Map 19 (BROADCAST_EDGE), Map 31 (BROADCAST_EDGE), Reducer 10 (BROADCAST_EDGE) + Map 14 <- Reducer 32 (BROADCAST_EDGE), Reducer 33 (BROADCAST_EDGE) + Map 15 <- Reducer 10 (BROADCAST_EDGE), Reducer 13 (BROADCAST_EDGE), Reducer 32 (BROADCAST_EDGE), Reducer 33 (BROADCAST_EDGE) + Map 25 <- Map 19 (BROADCAST_EDGE), Map 31 (BROADCAST_EDGE), Reducer 13 (BROADCAST_EDGE), Reducer 5 (BROADCAST_EDGE) + Map 7 <- Reducer 32 (BROADCAST_EDGE), Reducer 33 (BROADCAST_EDGE) + Reducer 10 <- Reducer 9 (CUSTOM_SIMPLE_EDGE) + Reducer 11 <- Map 14 (CUSTOM_SIMPLE_EDGE), Map 7 (CUSTOM_SIMPLE_EDGE) + Reducer 12 <- Reducer 11 (SIMPLE_EDGE) + Reducer 13 <- Reducer 12 (CUSTOM_SIMPLE_EDGE) Reducer 17 <- Map 16 (SIMPLE_EDGE) Reducer 18 <- Map 16 (SIMPLE_EDGE) - Reducer 2 <- Map 1 (CUSTOM_SIMPLE_EDGE), Map 14 (BROADCAST_EDGE), Map 34 (CUSTOM_SIMPLE_EDGE), Reducer 8 (BROADCAST_EDGE) + Reducer 2 <- Map 1 (CUSTOM_SIMPLE_EDGE), Map 34 (BROADCAST_EDGE), Map 6 (CUSTOM_SIMPLE_EDGE), Reducer 9 (BROADCAST_EDGE) Reducer 20 <- Map 19 (SIMPLE_EDGE) Reducer 21 <- Map 19 (SIMPLE_EDGE) Reducer 23 <- Map 22 (SIMPLE_EDGE) Reducer 24 <- Map 22 (SIMPLE_EDGE) - Reducer 26 <- Map 14 (BROADCAST_EDGE), Map 25 (CUSTOM_SIMPLE_EDGE), Map 34 (CUSTOM_SIMPLE_EDGE), Reducer 11 (BROADCAST_EDGE) - Reducer 27 <- Map 14 (BROADCAST_EDGE), Map 15 (BROADCAST_EDGE), Map 16 (BROADCAST_EDGE), Map 19 (BROADCAST_EDGE), Map 22 (BROADCAST_EDGE), Map 35 (CUSTOM_SIMPLE_EDGE), Reducer 18 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE), Reducer 24 (BROADCAST_EDGE), Reducer 26 (CUSTOM_SIMPLE_EDGE) + Reducer 26 <- Map 25 (CUSTOM_SIMPLE_EDGE), Map 34 (BROADCAST_EDGE), Map 6 (CUSTOM_SIMPLE_EDGE), Reducer 12 (BROADCAST_EDGE) + Reducer 27 <- Map 15 (CUSTOM_SIMPLE_EDGE), Map 16 (BROADCAST_EDGE), Map 19 (BROADCAST_EDGE), Map 22 (BROADCAST_EDGE), Map 35 (BROADCAST_EDGE), Reducer 18 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE), Reducer 24 (BROADCAST_EDGE), Reducer 26 (CUSTOM_SIMPLE_EDGE), Reducer 36 (BROADCAST_EDGE) Reducer 28 <- Reducer 27 (SIMPLE_EDGE) Reducer 29 <- Reducer 28 (CUSTOM_SIMPLE_EDGE), Reducer 4 (CUSTOM_SIMPLE_EDGE) - Reducer 3 <- Map 14 (BROADCAST_EDGE), Map 15 (BROADCAST_EDGE), Map 16 (BROADCAST_EDGE), Map 19 (BROADCAST_EDGE), Map 22 (BROADCAST_EDGE), Map 35 (CUSTOM_SIMPLE_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE), Reducer 20 (BROADCAST_EDGE), Reducer 23 (BROADCAST_EDGE) + Reducer 3 <- Map 15 (CUSTOM_SIMPLE_EDGE), Map 16 (BROADCAST_EDGE), Map 19 (BROADCAST_EDGE), Map 22 (BROADCAST_EDGE), Map 35 (BROADCAST_EDGE), Reducer 17 (BROADCAST_EDGE), Reducer 2 (CUSTOM_SIMPLE_EDGE), Reducer 20 (BROADCAST_EDGE), Reducer 23 (BROADCAST_EDGE), Reducer 37 (BROADCAST_EDGE) Reducer 30 <- Reducer 29 (SIMPLE_EDGE) Reducer 32 <- Map 31 (CUSTOM_SIMPLE_EDGE) Reducer 33 <- Map 31 (CUSTOM_SIMPLE_EDGE) + Reducer 36 <- Map 35 (SIMPLE_EDGE) + Reducer 37 <- Map 35 (SIMPLE_EDGE) Reducer 4 <- Reducer 3 (SIMPLE_EDGE) Reducer 5 <- Reducer 4 (CUSTOM_SIMPLE_EDGE) - Reducer 7 <- Map 13 (CUSTOM_SIMPLE_EDGE), Map 6 (CUSTOM_SIMPLE_EDGE) - Reducer 8 <- Reducer 7 (SIMPLE_EDGE) - Reducer 9 <- Reducer 8 (CUSTOM_SIMPLE_EDGE) + Reducer 8 <- Map 14 (CUSTOM_SIMPLE_EDGE), Map 7 (CUSTOM_SIMPLE_EDGE) + Reducer 9 <- Reducer 8 (SIMPLE_EDGE) #### A masked pattern was here #### Vertices: Map 1 Map Operator Tree: TableScan alias: store_sales - filterExpr: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_58_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_58_catalog_sales_cs_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_58_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_993_container, bigKeyColName:ss_item_sk, smallTablePos:1, keyRatio:1.8543009129597497E-9 + filterExpr: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_61_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_61_catalog_sales_cs_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_61_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_991_container, bigKeyColName:ss_item_sk, smallTablePos:1, keyRatio:1.9027793682005275E-9 Statistics: Num rows: 82510879939 Data size: 32917667058984 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_58_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_58_catalog_sales_cs_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_58_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) + predicate: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_61_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_61_catalog_sales_cs_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_61_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 71511093715 Data size: 28529308809584 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ss_item_sk (type: bigint), ss_customer_sk (type: bigint), ss_cdemo_sk (type: bigint), ss_hdemo_sk (type: bigint), ss_addr_sk (type: bigint), ss_store_sk (type: bigint), ss_ticket_number (type: bigint), ss_wholesale_cost (type: decimal(7,2)), ss_list_price (type: decimal(7,2)), ss_coupon_amt (type: decimal(7,2)), ss_sold_date_sk (type: bigint) @@ -60,7 +62,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11 input vertices: 1 Map 31 - Statistics: Num rows: 1300511220 Data size: 41616359416 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1314442053 Data size: 42062146072 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -70,17 +72,17 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col11 input vertices: 1 Map 19 - Statistics: Num rows: 261380636 Data size: 6273135640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 264180497 Data size: 6340332304 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 261380636 Data size: 6273135640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 264180497 Data size: 6340332304 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col11 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 13 + Map 14 Map Operator Tree: TableScan alias: catalog_returns @@ -116,72 +118,38 @@ STAGE PLANS: value expressions: _col2 (type: decimal(9,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 14 - Map Operator Tree: - TableScan - alias: ad1 - Statistics: Num rows: 40000000 Data size: 14760000000 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: ca_address_sk (type: bigint), ca_street_number (type: char(10)), ca_street_name (type: varchar(60)), ca_city (type: varchar(60)), ca_zip (type: char(10)) - outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 40000000 Data size: 14760000000 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 14760000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 14760000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 14760000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 14760000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) - Execution mode: vectorized, llap - LLAP IO: may be used (ACID table) Map 15 Map Operator Tree: TableScan - alias: store - filterExpr: (s_store_name is not null and s_zip is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE + alias: store_returns + filterExpr: ((sr_item_sk BETWEEN DynamicValue(RS_61_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_61_catalog_sales_cs_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_49_item_i_item_sk_min) AND DynamicValue(RS_49_item_i_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_61_catalog_sales_cs_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_49_item_i_item_sk_bloom_filter))) or (sr_item_sk BETWEEN DynamicValue(RS_159_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_159_catalog_sales_cs_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_147_item_i_item_sk_min) AND DynamicValue(RS_147_item_i_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_159_catalog_sales_cs_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_147_item_i_item_sk_bloom_filter)))) (type: boolean) + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (s_store_name is not null and s_zip is not null) (type: boolean) - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (sr_item_sk BETWEEN DynamicValue(RS_49_item_i_item_sk_min) AND DynamicValue(RS_49_item_i_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_61_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_61_catalog_sales_cs_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_49_item_i_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_61_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), s_zip (type: char(10)) - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE + expressions: sr_item_sk (type: bigint), sr_ticket_number (type: bigint) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: varchar(50)), _col2 (type: char(10)) + key expressions: _col0 (type: bigint), _col1 (type: bigint) + null sort order: zz + sort order: ++ + Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (sr_item_sk BETWEEN DynamicValue(RS_147_item_i_item_sk_min) AND DynamicValue(RS_147_item_i_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_159_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_159_catalog_sales_cs_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_147_item_i_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_159_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: sr_item_sk (type: bigint), sr_ticket_number (type: bigint) + outputColumnNames: _col0, _col1 + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: varchar(50)), _col2 (type: char(10)) + key expressions: _col0 (type: bigint), _col1 (type: bigint) + null sort order: zz + sort order: ++ + Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) + Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 16 @@ -363,11 +331,11 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_sales - filterExpr: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_156_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_156_catalog_sales_cs_item_sk_max) and ss_item_sk BETWEEN DynamicValue(RS_196_item_i_item_sk_min) AND DynamicValue(RS_196_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_156_catalog_sales_cs_item_sk_bloom_filter)) and in_bloom_filter(ss_item_sk, DynamicValue(RS_196_item_i_item_sk_bloom_filter))) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_1008_container, bigKeyColName:ss_item_sk, smallTablePos:1, keyRatio:1.8543009129597497E-9 + filterExpr: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_159_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_159_catalog_sales_cs_item_sk_max) and ss_item_sk BETWEEN DynamicValue(RS_196_item_i_item_sk_min) AND DynamicValue(RS_196_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_159_catalog_sales_cs_item_sk_bloom_filter)) and in_bloom_filter(ss_item_sk, DynamicValue(RS_196_item_i_item_sk_bloom_filter))) (type: boolean) + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_1006_container, bigKeyColName:ss_item_sk, smallTablePos:1, keyRatio:1.9027793682005275E-9 Statistics: Num rows: 82510879939 Data size: 32917667058984 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_196_item_i_item_sk_min) AND DynamicValue(RS_196_item_i_item_sk_max) and ss_item_sk BETWEEN DynamicValue(RS_156_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_156_catalog_sales_cs_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_196_item_i_item_sk_bloom_filter)) and in_bloom_filter(ss_item_sk, DynamicValue(RS_156_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) + predicate: (ss_cdemo_sk is not null and ss_addr_sk is not null and ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_196_item_i_item_sk_min) AND DynamicValue(RS_196_item_i_item_sk_max) and ss_item_sk BETWEEN DynamicValue(RS_159_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_159_catalog_sales_cs_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_196_item_i_item_sk_bloom_filter)) and in_bloom_filter(ss_item_sk, DynamicValue(RS_159_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 71511093715 Data size: 28529308809584 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ss_item_sk (type: bigint), ss_customer_sk (type: bigint), ss_cdemo_sk (type: bigint), ss_hdemo_sk (type: bigint), ss_addr_sk (type: bigint), ss_store_sk (type: bigint), ss_ticket_number (type: bigint), ss_wholesale_cost (type: decimal(7,2)), ss_list_price (type: decimal(7,2)), ss_coupon_amt (type: decimal(7,2)), ss_sold_date_sk (type: bigint) @@ -382,7 +350,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12 input vertices: 1 Map 31 - Statistics: Num rows: 1300511220 Data size: 180771059956 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1314442053 Data size: 182707443603 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -392,13 +360,13 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col11, _col12 input vertices: 1 Map 19 - Statistics: Num rows: 261380636 Data size: 34240863692 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 264180497 Data size: 34607643343 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 261380636 Data size: 34240863692 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 264180497 Data size: 34607643343 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col11 (type: bigint), _col12 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -407,25 +375,25 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_current_price BETWEEN 36 AND 45 and (i_color) IN ('burnished ', 'chocolate ', 'dim ', 'maroon ', 'navajo ', 'steel ')) (type: boolean) - Statistics: Num rows: 462000 Data size: 145861408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 145634124 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_current_price BETWEEN 36 AND 45 and (i_color) IN ('burnished ', 'chocolate ', 'dim ', 'maroon ', 'navajo ', 'steel ')) (type: boolean) - Statistics: Num rows: 8402 Data size: 2652792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 2677223 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_product_name (type: char(50)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 8402 Data size: 966230 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 974440 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 8402 Data size: 966230 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 974440 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 8402 Data size: 67216 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 67936 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -440,17 +408,17 @@ STAGE PLANS: Select Operator expressions: i_item_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 8402 Data size: 67216 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 67936 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 8402 Data size: 67216 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 67936 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 8402 Data size: 67216 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8492 Data size: 67936 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -465,6 +433,74 @@ STAGE PLANS: Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 34 + Map Operator Tree: + TableScan + alias: store + filterExpr: (s_zip is not null and s_store_name is not null) (type: boolean) + Statistics: Num rows: 1704 Data size: 313381 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (s_zip is not null and s_store_name is not null) (type: boolean) + Statistics: Num rows: 1681 Data size: 309126 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), s_zip (type: char(10)) + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1681 Data size: 309126 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 1681 Data size: 309126 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: varchar(50)), _col2 (type: char(10)) + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 1681 Data size: 309126 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: varchar(50)), _col2 (type: char(10)) + Execution mode: vectorized, llap + LLAP IO: may be used (ACID table) + Map 35 + Map Operator Tree: + TableScan + alias: ad2 + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: ca_address_sk (type: bigint), ca_street_number (type: char(10)), ca_street_name (type: varchar(60)), ca_city (type: varchar(60)), ca_zip (type: char(10)) + outputColumnNames: _col0, _col1, _col2, _col3, _col4 + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) + Execution mode: vectorized, llap + LLAP IO: may be used (ACID table) + Map 6 Map Operator Tree: TableScan alias: customer @@ -493,41 +529,7 @@ STAGE PLANS: value expressions: _col1 (type: bigint), _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 35 - Map Operator Tree: - TableScan - alias: store_returns - filterExpr: ((sr_item_sk BETWEEN DynamicValue(RS_156_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_156_catalog_sales_cs_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_147_item_i_item_sk_min) AND DynamicValue(RS_147_item_i_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_156_catalog_sales_cs_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_147_item_i_item_sk_bloom_filter))) or (sr_item_sk BETWEEN DynamicValue(RS_58_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_58_catalog_sales_cs_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_49_item_i_item_sk_min) AND DynamicValue(RS_49_item_i_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_58_catalog_sales_cs_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_49_item_i_item_sk_bloom_filter)))) (type: boolean) - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (sr_item_sk BETWEEN DynamicValue(RS_147_item_i_item_sk_min) AND DynamicValue(RS_147_item_i_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_156_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_156_catalog_sales_cs_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_147_item_i_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_156_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: sr_item_sk (type: bigint), sr_ticket_number (type: bigint) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint), _col1 (type: bigint) - null sort order: zz - sort order: ++ - Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (sr_item_sk BETWEEN DynamicValue(RS_49_item_i_item_sk_min) AND DynamicValue(RS_49_item_i_item_sk_max) and sr_item_sk BETWEEN DynamicValue(RS_58_catalog_sales_cs_item_sk_min) AND DynamicValue(RS_58_catalog_sales_cs_item_sk_max) and in_bloom_filter(sr_item_sk, DynamicValue(RS_49_item_i_item_sk_bloom_filter)) and in_bloom_filter(sr_item_sk, DynamicValue(RS_58_catalog_sales_cs_item_sk_bloom_filter))) (type: boolean) - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: sr_item_sk (type: bigint), sr_ticket_number (type: bigint) - outputColumnNames: _col0, _col1 - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint), _col1 (type: bigint) - null sort order: zz - sort order: ++ - Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 8634166995 Data size: 138146671920 Basic stats: COMPLETE Column stats: COMPLETE - Execution mode: vectorized, llap - LLAP IO: may be used (ACID table) - Map 6 + Map 7 Map Operator Tree: TableScan alias: catalog_sales @@ -564,6 +566,24 @@ STAGE PLANS: Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 10 + Execution mode: vectorized, llap + Reduce Operator Tree: + Group By Operator + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1000000) + mode: final + outputColumnNames: _col0, _col1, _col2 + Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + Reduce Output Operator + null sort order: + sort order: + Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + Reducer 11 Execution mode: vectorized, llap Reduce Operator Tree: Map Join Operator @@ -574,7 +594,7 @@ STAGE PLANS: 1 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) outputColumnNames: _col0, _col2, _col5 input vertices: - 1 Map 13 + 1 Map 14 Statistics: Num rows: 41876960211 Data size: 9691486353656 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator @@ -591,7 +611,7 @@ STAGE PLANS: Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 16946565830 Data size: 3931603272560 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: decimal(19,2)) - Reducer 11 + Reducer 12 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator @@ -628,7 +648,7 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reducer 12 + Reducer 13 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator @@ -681,36 +701,36 @@ STAGE PLANS: 1 KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19 input vertices: - 1 Map 34 - Statistics: Num rows: 226670367 Data size: 14429217296 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 6 + Statistics: Num rows: 229098418 Data size: 14584612560 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: bigint) + 0 _col5 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19 + outputColumnNames: _col0, _col2, _col3, _col4, _col6, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Reducer 8 - Statistics: Num rows: 226670367 Data size: 14429217296 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 34 + Statistics: Num rows: 226271857 Data size: 54453829478 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col4 (type: bigint) + 0 _col0 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col2, _col3, _col5, _col6, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25 + outputColumnNames: _col0, _col2, _col3, _col4, _col6, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Map 14 - Statistics: Num rows: 226670367 Data size: 96257219775 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 9 + Statistics: Num rows: 226271857 Data size: 54453829478 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col6 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col6 (type: bigint) - Statistics: Num rows: 226670367 Data size: 96257219775 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col2 (type: bigint), _col3 (type: bigint), _col5 (type: bigint), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col11 (type: bigint), _col15 (type: bigint), _col16 (type: bigint), _col17 (type: bigint), _col18 (type: bigint), _col19 (type: bigint), _col22 (type: char(10)), _col23 (type: varchar(60)), _col24 (type: varchar(60)), _col25 (type: char(10)) + Statistics: Num rows: 226271857 Data size: 54453829478 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col11 (type: bigint), _col15 (type: bigint), _col16 (type: bigint), _col17 (type: bigint), _col18 (type: bigint), _col19 (type: bigint), _col21 (type: varchar(50)), _col22 (type: char(10)) Reducer 20 Execution mode: vectorized, llap Reduce Operator Tree: @@ -774,36 +794,36 @@ STAGE PLANS: 1 KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19 input vertices: - 1 Map 34 - Statistics: Num rows: 226670367 Data size: 38682946565 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 6 + Statistics: Num rows: 229098418 Data size: 39098141146 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col0 (type: bigint) + 0 _col5 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19 + outputColumnNames: _col0, _col2, _col3, _col4, _col6, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Reducer 11 - Statistics: Num rows: 226670367 Data size: 38682946565 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 34 + Statistics: Num rows: 226271857 Data size: 78664916037 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col4 (type: bigint) + 0 _col0 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col2, _col3, _col5, _col6, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25 + outputColumnNames: _col0, _col2, _col3, _col4, _col6, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Map 14 - Statistics: Num rows: 226670367 Data size: 120510949044 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 12 + Statistics: Num rows: 226271857 Data size: 78664916037 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col6 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col6 (type: bigint) - Statistics: Num rows: 226670367 Data size: 120510949044 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col2 (type: bigint), _col3 (type: bigint), _col5 (type: bigint), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col11 (type: bigint), _col12 (type: char(50)), _col15 (type: bigint), _col16 (type: bigint), _col17 (type: bigint), _col18 (type: bigint), _col19 (type: bigint), _col22 (type: char(10)), _col23 (type: varchar(60)), _col24 (type: varchar(60)), _col25 (type: char(10)) + Statistics: Num rows: 226271857 Data size: 78664916037 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col2 (type: bigint), _col3 (type: bigint), _col4 (type: bigint), _col7 (type: decimal(7,2)), _col8 (type: decimal(7,2)), _col9 (type: decimal(7,2)), _col11 (type: bigint), _col12 (type: char(50)), _col15 (type: bigint), _col16 (type: bigint), _col17 (type: bigint), _col18 (type: bigint), _col19 (type: bigint), _col21 (type: varchar(50)), _col22 (type: char(10)) Reducer 27 Execution mode: vectorized, llap Reduce Operator Tree: @@ -813,134 +833,134 @@ STAGE PLANS: keys: 0 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) 1 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) - outputColumnNames: _col2, _col3, _col5, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25 + outputColumnNames: _col2, _col3, _col4, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Map 35 - Statistics: Num rows: 382653083 Data size: 253525082388 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 15 + Statistics: Num rows: 381980339 Data size: 182794835869 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col5 (type: bigint) + 0 _col3 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25, _col29, _col30 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Map 15 - Statistics: Num rows: 382653083 Data size: 320006816343 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 18 + Statistics: Num rows: 381980339 Data size: 181549168005 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col3 (type: bigint) + 0 _col16 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col12, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25, _col29, _col30 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Reducer 18 - Statistics: Num rows: 382653083 Data size: 318758954607 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 16 + Statistics: Num rows: 381980339 Data size: 178512743765 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col16 (type: bigint) + 0 _col19 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col18, _col19, _col22, _col23, _col24, _col25, _col29, _col30 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col18, _col21, _col22, _col29 input vertices: - 1 Map 16 - Statistics: Num rows: 382653083 Data size: 315717148415 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 21 + Statistics: Num rows: 381980339 Data size: 177004244401 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col19 (type: bigint) + 0 _col18 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col18, _col22, _col23, _col24, _col25, _col29, _col30, _col34 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col21, _col22, _col29, _col31 input vertices: - 1 Reducer 21 - Statistics: Num rows: 382653083 Data size: 314205958075 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 19 + Statistics: Num rows: 381980339 Data size: 175495753381 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col18 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36 + outputColumnNames: _col4, _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col21, _col22, _col29, _col31, _col33 input vertices: - 1 Map 19 - Statistics: Num rows: 382653083 Data size: 312694776079 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 24 + Statistics: Num rows: 381980339 Data size: 206718414332 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col15 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col7, _col8, _col9, _col11, _col12, _col15, _col17, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36, _col38 + outputColumnNames: _col4, _col7, _col8, _col9, _col11, _col12, _col17, _col21, _col22, _col29, _col31, _col33, _col35 input vertices: - 1 Reducer 24 - Statistics: Num rows: 382653083 Data size: 343972426398 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col15 (type: bigint) - 1 _col0 (type: bigint) - outputColumnNames: _col7, _col8, _col9, _col11, _col12, _col17, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36, _col38, _col40 - input vertices: - 1 Map 22 - Statistics: Num rows: 382653083 Data size: 373456129549 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (_col38 <> _col40) (type: boolean) - Statistics: Num rows: 382653083 Data size: 373456129549 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 22 + Statistics: Num rows: 381980339 Data size: 236150316195 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (_col33 <> _col35) (type: boolean) + Statistics: Num rows: 381980339 Data size: 236150316195 Basic stats: COMPLETE Column stats: COMPLETE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col4 (type: bigint) + 1 _col0 (type: bigint) + outputColumnNames: _col7, _col8, _col9, _col11, _col12, _col17, _col21, _col22, _col29, _col31, _col37, _col38, _col39, _col40 + input vertices: + 1 Reducer 36 + Statistics: Num rows: 381980339 Data size: 307429673439 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: 0 _col17 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col7, _col8, _col9, _col11, _col12, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36, _col42, _col43, _col44, _col45 + outputColumnNames: _col7, _col8, _col9, _col11, _col12, _col21, _col22, _col29, _col31, _col37, _col38, _col39, _col40, _col42, _col43, _col44, _col45 input vertices: - 1 Map 14 - Statistics: Num rows: 382653083 Data size: 443481643738 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 35 + Statistics: Num rows: 381980339 Data size: 441835513465 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(), sum(_col7), sum(_col8), sum(_col9) - keys: _col29 (type: varchar(50)), _col11 (type: bigint), _col30 (type: char(10)), _col22 (type: char(10)), _col23 (type: varchar(60)), _col24 (type: varchar(60)), _col25 (type: char(10)), _col12 (type: char(50)), _col34 (type: int), _col36 (type: int), _col42 (type: char(10)), _col43 (type: varchar(60)), _col44 (type: varchar(60)), _col45 (type: char(10)) - minReductionHashAggr: 0.823521 + keys: _col21 (type: varchar(50)), _col11 (type: bigint), _col22 (type: char(10)), _col12 (type: char(50)), _col29 (type: int), _col31 (type: int), _col37 (type: char(10)), _col38 (type: varchar(60)), _col39 (type: varchar(60)), _col40 (type: char(10)), _col42 (type: char(10)), _col43 (type: varchar(60)), _col44 (type: varchar(60)), _col45 (type: char(10)) + minReductionHashAggr: 0.82318413 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17 - Statistics: Num rows: 382653083 Data size: 522704111378 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 520918699793 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: char(10)), _col4 (type: varchar(60)), _col5 (type: varchar(60)), _col6 (type: char(10)), _col7 (type: char(50)), _col8 (type: int), _col9 (type: int), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(60)), _col13 (type: char(10)) + key expressions: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: char(50)), _col4 (type: int), _col5 (type: int), _col6 (type: char(10)), _col7 (type: varchar(60)), _col8 (type: varchar(60)), _col9 (type: char(10)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(60)), _col13 (type: char(10)) null sort order: zzzzzzzzzzzzzz sort order: ++++++++++++++ - Map-reduce partition columns: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: char(10)), _col4 (type: varchar(60)), _col5 (type: varchar(60)), _col6 (type: char(10)), _col7 (type: char(50)), _col8 (type: int), _col9 (type: int), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(60)), _col13 (type: char(10)) - Statistics: Num rows: 382653083 Data size: 522704111378 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: char(50)), _col4 (type: int), _col5 (type: int), _col6 (type: char(10)), _col7 (type: varchar(60)), _col8 (type: varchar(60)), _col9 (type: char(10)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(60)), _col13 (type: char(10)) + Statistics: Num rows: 381980339 Data size: 520918699793 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col14 (type: bigint), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)) Reducer 28 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator aggregations: count(VALUE._col0), sum(VALUE._col1), sum(VALUE._col2), sum(VALUE._col3) - keys: KEY._col0 (type: varchar(50)), KEY._col1 (type: bigint), KEY._col2 (type: char(10)), KEY._col3 (type: char(10)), KEY._col4 (type: varchar(60)), KEY._col5 (type: varchar(60)), KEY._col6 (type: char(10)), KEY._col7 (type: char(50)), KEY._col8 (type: int), KEY._col9 (type: int), KEY._col10 (type: char(10)), KEY._col11 (type: varchar(60)), KEY._col12 (type: varchar(60)), KEY._col13 (type: char(10)) + keys: KEY._col0 (type: varchar(50)), KEY._col1 (type: bigint), KEY._col2 (type: char(10)), KEY._col3 (type: char(50)), KEY._col4 (type: int), KEY._col5 (type: int), KEY._col6 (type: char(10)), KEY._col7 (type: varchar(60)), KEY._col8 (type: varchar(60)), KEY._col9 (type: char(10)), KEY._col10 (type: char(10)), KEY._col11 (type: varchar(60)), KEY._col12 (type: varchar(60)), KEY._col13 (type: char(10)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17 - Statistics: Num rows: 382653083 Data size: 522704111378 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 520918699793 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col7 (type: char(50)), _col1 (type: bigint), _col0 (type: varchar(50)), _col2 (type: char(10)), _col3 (type: char(10)), _col4 (type: varchar(60)), _col5 (type: varchar(60)), _col6 (type: char(10)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(60)), _col13 (type: char(10)), _col14 (type: bigint), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)) + expressions: _col3 (type: char(50)), _col1 (type: bigint), _col0 (type: varchar(50)), _col2 (type: char(10)), _col6 (type: char(10)), _col7 (type: varchar(60)), _col8 (type: varchar(60)), _col9 (type: char(10)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(60)), _col13 (type: char(10)), _col14 (type: bigint), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col14, _col15, _col16, _col17 - Statistics: Num rows: 382653083 Data size: 519642886714 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 517862857081 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col14 is not null (type: boolean) - Statistics: Num rows: 382653083 Data size: 519642886714 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 517862857081 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(50)), _col1 (type: bigint), _col2 (type: varchar(50)), _col3 (type: char(10)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: varchar(60)), _col7 (type: char(10)), _col8 (type: char(10)), _col9 (type: varchar(60)), _col10 (type: varchar(60)), _col11 (type: char(10)), _col14 (type: bigint), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15 - Statistics: Num rows: 382653083 Data size: 519642886714 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 517862857081 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: varchar(50)), _col1 (type: bigint), _col3 (type: char(10)) null sort order: zzz sort order: +++ Map-reduce partition columns: _col2 (type: varchar(50)), _col1 (type: bigint), _col3 (type: char(10)) - Statistics: Num rows: 382653083 Data size: 519642886714 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 517862857081 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: varchar(60)), _col7 (type: char(10)), _col8 (type: char(10)), _col9 (type: varchar(60)), _col10 (type: varchar(60)), _col11 (type: char(10)), _col12 (type: bigint), _col13 (type: decimal(17,2)), _col14 (type: decimal(17,2)), _col15 (type: decimal(17,2)) Reducer 29 Execution mode: vectorized, llap @@ -954,20 +974,20 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col6, _col7, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22 input vertices: 0 Reducer 4 - Statistics: Num rows: 99947700975703 Data size: 169311405452840883 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 99732726850686 Data size: 168947238418618801 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Filter Operator predicate: (_col3 <= _col19) (type: boolean) - Statistics: Num rows: 33315900325234 Data size: 56437135150946396 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 33244242283562 Data size: 56315746139540421 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col7 (type: char(50)), _col9 (type: varchar(50)), _col10 (type: char(10)), _col11 (type: char(10)), _col12 (type: varchar(60)), _col13 (type: varchar(60)), _col14 (type: char(10)), _col15 (type: char(10)), _col16 (type: varchar(60)), _col17 (type: varchar(60)), _col18 (type: char(10)), _col19 (type: bigint), _col20 (type: decimal(17,2)), _col21 (type: decimal(17,2)), _col22 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18 - Statistics: Num rows: 33315900325234 Data size: 56437135150946396 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 33244242283562 Data size: 56315746139540421 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: varchar(50)), _col18 (type: bigint) null sort order: zzz sort order: +++ - Statistics: Num rows: 33315900325234 Data size: 56437135150946396 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 33244242283562 Data size: 56315746139540421 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: char(10)), _col3 (type: char(10)), _col4 (type: varchar(60)), _col5 (type: varchar(60)), _col6 (type: char(10)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: varchar(60)), _col10 (type: char(10)), _col11 (type: bigint), _col12 (type: decimal(17,2)), _col13 (type: decimal(17,2)), _col14 (type: decimal(17,2)), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)), _col17 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -978,107 +998,107 @@ STAGE PLANS: keys: 0 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) 1 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) - outputColumnNames: _col2, _col3, _col5, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25 + outputColumnNames: _col2, _col3, _col4, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Map 35 - Statistics: Num rows: 382653083 Data size: 212581202507 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 15 + Statistics: Num rows: 381980339 Data size: 141922941736 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col5 (type: bigint) + 0 _col3 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25, _col29, _col30 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Map 15 - Statistics: Num rows: 382653083 Data size: 279062936462 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 17 + Statistics: Num rows: 381980339 Data size: 140677273872 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col3 (type: bigint) + 0 _col16 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col15, _col16, _col17, _col18, _col19, _col22, _col23, _col24, _col25, _col29, _col30 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col15, _col17, _col18, _col19, _col21, _col22 input vertices: - 1 Reducer 17 - Statistics: Num rows: 382653083 Data size: 277815074726 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 16 + Statistics: Num rows: 381980339 Data size: 137640849632 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col16 (type: bigint) + 0 _col19 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col15, _col17, _col18, _col19, _col22, _col23, _col24, _col25, _col29, _col30 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col15, _col17, _col18, _col21, _col22, _col29 input vertices: - 1 Map 16 - Statistics: Num rows: 382653083 Data size: 274773268534 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 20 + Statistics: Num rows: 381980339 Data size: 136132350268 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col19 (type: bigint) + 0 _col18 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col15, _col17, _col18, _col22, _col23, _col24, _col25, _col29, _col30, _col34 + outputColumnNames: _col2, _col4, _col7, _col8, _col9, _col11, _col15, _col17, _col21, _col22, _col29, _col31 input vertices: - 1 Reducer 20 - Statistics: Num rows: 382653083 Data size: 273262078194 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 19 + Statistics: Num rows: 381980339 Data size: 134623859248 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col18 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col2, _col7, _col8, _col9, _col11, _col15, _col17, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36 + outputColumnNames: _col4, _col7, _col8, _col9, _col11, _col15, _col17, _col21, _col22, _col29, _col31, _col33 input vertices: - 1 Map 19 - Statistics: Num rows: 382653083 Data size: 271750896198 Basic stats: COMPLETE Column stats: COMPLETE + 1 Reducer 23 + Statistics: Num rows: 381980339 Data size: 165846520199 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col15 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col7, _col8, _col9, _col11, _col15, _col17, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36, _col38 + outputColumnNames: _col4, _col7, _col8, _col9, _col11, _col17, _col21, _col22, _col29, _col31, _col33, _col35 input vertices: - 1 Reducer 23 - Statistics: Num rows: 382653083 Data size: 303028546517 Basic stats: COMPLETE Column stats: COMPLETE - Map Join Operator - condition map: - Inner Join 0 to 1 - keys: - 0 _col15 (type: bigint) - 1 _col0 (type: bigint) - outputColumnNames: _col7, _col8, _col9, _col11, _col17, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36, _col38, _col40 - input vertices: - 1 Map 22 - Statistics: Num rows: 382653083 Data size: 332512249668 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: (_col38 <> _col40) (type: boolean) - Statistics: Num rows: 382653083 Data size: 332512249668 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 22 + Statistics: Num rows: 381980339 Data size: 195278422062 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: (_col33 <> _col35) (type: boolean) + Statistics: Num rows: 381980339 Data size: 195278422062 Basic stats: COMPLETE Column stats: COMPLETE + Map Join Operator + condition map: + Inner Join 0 to 1 + keys: + 0 _col4 (type: bigint) + 1 _col0 (type: bigint) + outputColumnNames: _col7, _col8, _col9, _col11, _col17, _col21, _col22, _col29, _col31, _col37, _col38, _col39, _col40 + input vertices: + 1 Reducer 37 + Statistics: Num rows: 381980339 Data size: 266557779306 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: 0 _col17 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col7, _col8, _col9, _col11, _col22, _col23, _col24, _col25, _col29, _col30, _col34, _col36, _col42, _col43, _col44, _col45 + outputColumnNames: _col7, _col8, _col9, _col11, _col21, _col22, _col29, _col31, _col37, _col38, _col39, _col40, _col42, _col43, _col44, _col45 input vertices: - 1 Map 14 - Statistics: Num rows: 382653083 Data size: 402537763857 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 35 + Statistics: Num rows: 381980339 Data size: 400963619332 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(), sum(_col7), sum(_col8), sum(_col9) - keys: _col29 (type: varchar(50)), _col11 (type: bigint), _col30 (type: char(10)), _col22 (type: char(10)), _col23 (type: varchar(60)), _col24 (type: varchar(60)), _col25 (type: char(10)), _col34 (type: int), _col36 (type: int), _col42 (type: char(10)), _col43 (type: varchar(60)), _col44 (type: varchar(60)), _col45 (type: char(10)) - minReductionHashAggr: 0.8260248 + keys: _col21 (type: varchar(50)), _col11 (type: bigint), _col22 (type: char(10)), _col29 (type: int), _col31 (type: int), _col37 (type: char(10)), _col38 (type: varchar(60)), _col39 (type: varchar(60)), _col40 (type: char(10)), _col42 (type: char(10)), _col43 (type: varchar(60)), _col44 (type: varchar(60)), _col45 (type: char(10)) + minReductionHashAggr: 0.8256874 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16 - Statistics: Num rows: 382653083 Data size: 481760231497 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 480046805660 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: char(10)), _col4 (type: varchar(60)), _col5 (type: varchar(60)), _col6 (type: char(10)), _col7 (type: int), _col8 (type: int), _col9 (type: char(10)), _col10 (type: varchar(60)), _col11 (type: varchar(60)), _col12 (type: char(10)) + key expressions: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: int), _col4 (type: int), _col5 (type: char(10)), _col6 (type: varchar(60)), _col7 (type: varchar(60)), _col8 (type: char(10)), _col9 (type: char(10)), _col10 (type: varchar(60)), _col11 (type: varchar(60)), _col12 (type: char(10)) null sort order: zzzzzzzzzzzzz sort order: +++++++++++++ - Map-reduce partition columns: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: char(10)), _col4 (type: varchar(60)), _col5 (type: varchar(60)), _col6 (type: char(10)), _col7 (type: int), _col8 (type: int), _col9 (type: char(10)), _col10 (type: varchar(60)), _col11 (type: varchar(60)), _col12 (type: char(10)) - Statistics: Num rows: 382653083 Data size: 481760231497 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: varchar(50)), _col1 (type: bigint), _col2 (type: char(10)), _col3 (type: int), _col4 (type: int), _col5 (type: char(10)), _col6 (type: varchar(60)), _col7 (type: varchar(60)), _col8 (type: char(10)), _col9 (type: char(10)), _col10 (type: varchar(60)), _col11 (type: varchar(60)), _col12 (type: char(10)) + Statistics: Num rows: 381980339 Data size: 480046805660 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col13 (type: bigint), _col14 (type: decimal(17,2)), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)) Reducer 30 Execution mode: vectorized, llap @@ -1086,10 +1106,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey1 (type: varchar(50)), VALUE._col0 (type: char(10)), VALUE._col1 (type: char(10)), VALUE._col2 (type: varchar(60)), VALUE._col3 (type: varchar(60)), VALUE._col4 (type: char(10)), VALUE._col5 (type: char(10)), VALUE._col6 (type: varchar(60)), VALUE._col7 (type: varchar(60)), VALUE._col8 (type: char(10)), 2000 (type: int), VALUE._col9 (type: bigint), VALUE._col10 (type: decimal(17,2)), VALUE._col11 (type: decimal(17,2)), VALUE._col12 (type: decimal(17,2)), VALUE._col13 (type: decimal(17,2)), VALUE._col14 (type: decimal(17,2)), VALUE._col15 (type: decimal(17,2)), 2001 (type: int), KEY.reducesinkkey2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20 - Statistics: Num rows: 33315900325234 Data size: 56703662353548268 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 33244242283562 Data size: 56581700077808917 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 33315900325234 Data size: 56703662353548268 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 33244242283562 Data size: 56581700077808917 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -1140,37 +1160,63 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + Reducer 36 + Execution mode: vectorized, llap + Reduce Operator Tree: + Select Operator + expressions: KEY.reducesinkkey0 (type: bigint), VALUE._col0 (type: char(10)), VALUE._col1 (type: varchar(60)), VALUE._col2 (type: varchar(60)), VALUE._col3 (type: char(10)) + outputColumnNames: _col0, _col1, _col2, _col3, _col4 + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) + Reducer 37 + Execution mode: vectorized, llap + Reduce Operator Tree: + Select Operator + expressions: KEY.reducesinkkey0 (type: bigint), VALUE._col0 (type: char(10)), VALUE._col1 (type: varchar(60)), VALUE._col2 (type: varchar(60)), VALUE._col3 (type: char(10)) + outputColumnNames: _col0, _col1, _col2, _col3, _col4 + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 40000000 Data size: 14326780359 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col4 (type: char(10)) Reducer 4 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator aggregations: count(VALUE._col0), sum(VALUE._col1), sum(VALUE._col2), sum(VALUE._col3) - keys: KEY._col0 (type: varchar(50)), KEY._col1 (type: bigint), KEY._col2 (type: char(10)), KEY._col3 (type: char(10)), KEY._col4 (type: varchar(60)), KEY._col5 (type: varchar(60)), KEY._col6 (type: char(10)), KEY._col7 (type: int), KEY._col8 (type: int), KEY._col9 (type: char(10)), KEY._col10 (type: varchar(60)), KEY._col11 (type: varchar(60)), KEY._col12 (type: char(10)) + keys: KEY._col0 (type: varchar(50)), KEY._col1 (type: bigint), KEY._col2 (type: char(10)), KEY._col3 (type: int), KEY._col4 (type: int), KEY._col5 (type: char(10)), KEY._col6 (type: varchar(60)), KEY._col7 (type: varchar(60)), KEY._col8 (type: char(10)), KEY._col9 (type: char(10)), KEY._col10 (type: varchar(60)), KEY._col11 (type: varchar(60)), KEY._col12 (type: char(10)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16 - Statistics: Num rows: 382653083 Data size: 481760231497 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 480046805660 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: bigint), _col0 (type: varchar(50)), _col2 (type: char(10)), _col13 (type: bigint), _col14 (type: decimal(17,2)), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col13, _col14, _col15, _col16 - Statistics: Num rows: 382653083 Data size: 202423480907 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 202067597472 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col13 is not null (type: boolean) - Statistics: Num rows: 382653083 Data size: 202423480907 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 202067597472 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint), _col1 (type: varchar(50)), _col2 (type: char(10)), _col13 (type: bigint), _col14 (type: decimal(17,2)), _col15 (type: decimal(17,2)), _col16 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 382653083 Data size: 202423480907 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 202067597472 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: varchar(50)), _col0 (type: bigint), _col2 (type: char(10)) null sort order: zzz sort order: +++ Map-reduce partition columns: _col1 (type: varchar(50)), _col0 (type: bigint), _col2 (type: char(10)) - Statistics: Num rows: 382653083 Data size: 202423480907 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 202067597472 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 382653083 Data size: 3061224664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 381980339 Data size: 3055842712 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -1195,7 +1241,7 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reducer 7 + Reducer 8 Execution mode: vectorized, llap Reduce Operator Tree: Map Join Operator @@ -1206,7 +1252,7 @@ STAGE PLANS: 1 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) outputColumnNames: _col0, _col2, _col5 input vertices: - 1 Map 13 + 1 Map 14 Statistics: Num rows: 41876960211 Data size: 9691486353656 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator @@ -1223,7 +1269,7 @@ STAGE PLANS: Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 16946565830 Data size: 3931603272560 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: decimal(19,2)) - Reducer 8 + Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator @@ -1260,24 +1306,6 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reducer 9 - Execution mode: vectorized, llap - Reduce Operator Tree: - Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1000000) - mode: final - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) Stage: Stage-0 Fetch Operator diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query65.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query65.q.out index 9dd942616db6..a5557a57e312 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query65.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query65.q.out @@ -59,17 +59,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 238136080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 237807892 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_desc (type: varchar(200)), i_current_price (type: decimal(7,2)), i_wholesale_cost (type: decimal(7,2)), i_brand (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 462000 Data size: 238136080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 237807892 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 238136080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 237807892 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(200)), _col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)), _col4 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -175,17 +175,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 162704 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 162704 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 162704 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -223,7 +223,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col6 input vertices: 1 Map 9 - Statistics: Num rows: 5268374 Data size: 1095821792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5268374 Data size: 1095820912 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -233,22 +233,22 @@ STAGE PLANS: outputColumnNames: _col2, _col6, _col8, _col9, _col10, _col11 input vertices: 1 Map 10 - Statistics: Num rows: 5268374 Data size: 3729752872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5268374 Data size: 3729423804 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col6 (type: varchar(50)), _col8 (type: varchar(200)) null sort order: zz - Statistics: Num rows: 5268374 Data size: 3729752872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5268374 Data size: 3729423804 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col6 (type: varchar(50)), _col8 (type: varchar(200)), _col2 (type: decimal(17,2)), _col9 (type: decimal(7,2)), _col10 (type: decimal(7,2)), _col11 (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5268374 Data size: 3729496728 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5268374 Data size: 3728838220 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(50)), _col1 (type: varchar(200)) null sort order: zz sort order: ++ - Statistics: Num rows: 5268374 Data size: 3729496728 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5268374 Data size: 3728838220 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)), _col3 (type: decimal(7,2)), _col4 (type: decimal(7,2)), _col5 (type: char(50)) Reducer 3 Execution mode: vectorized, llap @@ -256,7 +256,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: varchar(50)), KEY.reducesinkkey1 (type: varchar(200)), VALUE._col0 (type: decimal(17,2)), VALUE._col1 (type: decimal(7,2)), VALUE._col2 (type: decimal(7,2)), VALUE._col3 (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5268374 Data size: 3729496728 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5268374 Data size: 3728838220 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 70800 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query66.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query66.q.out index fd52072a7b8d..5575fac99ee4 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query66.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query66.q.out @@ -377,12 +377,12 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(20)), KEY._col1 (type: int), KEY._col2 (type: varchar(60)), KEY._col3 (type: varchar(30)), KEY._col4 (type: char(2)), KEY._col5 (type: varchar(20)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41 - Statistics: Num rows: 2122848 Data size: 9574044480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2044224 Data size: 9219450240 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(20)) null sort order: z sort order: + - Statistics: Num rows: 2122848 Data size: 9574044480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2044224 Data size: 9219450240 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: varchar(60)), _col3 (type: varchar(30)), _col4 (type: char(2)), _col5 (type: varchar(20)), _col6 (type: decimal(38,2)), _col7 (type: decimal(38,2)), _col8 (type: decimal(38,2)), _col9 (type: decimal(38,2)), _col10 (type: decimal(38,2)), _col11 (type: decimal(38,2)), _col12 (type: decimal(38,2)), _col13 (type: decimal(38,2)), _col14 (type: decimal(38,2)), _col15 (type: decimal(38,2)), _col16 (type: decimal(38,2)), _col17 (type: decimal(38,2)), _col18 (type: decimal(38,12)), _col19 (type: decimal(38,12)), _col20 (type: decimal(38,12)), _col21 (type: decimal(38,12)), _col22 (type: decimal(38,12)), _col23 (type: decimal(38,12)), _col24 (type: decimal(38,12)), _col25 (type: decimal(38,12)), _col26 (type: decimal(38,12)), _col27 (type: decimal(38,12)), _col28 (type: decimal(38,12)), _col29 (type: decimal(38,12)), _col30 (type: decimal(38,2)), _col31 (type: decimal(38,2)), _col32 (type: decimal(38,2)), _col33 (type: decimal(38,2)), _col34 (type: decimal(38,2)), _col35 (type: decimal(38,2)), _col36 (type: decimal(38,2)), _col37 (type: decimal(38,2)), _col38 (type: decimal(38,2)), _col39 (type: decimal(38,2)), _col40 (type: decimal(38,2)), _col41 (type: decimal(38,2)) Reducer 5 Execution mode: vectorized, llap @@ -390,7 +390,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: varchar(20)), VALUE._col0 (type: int), VALUE._col1 (type: varchar(60)), VALUE._col2 (type: varchar(30)), VALUE._col3 (type: char(2)), VALUE._col4 (type: varchar(20)), VALUE._col5 (type: decimal(38,2)), VALUE._col6 (type: decimal(38,2)), VALUE._col7 (type: decimal(38,2)), VALUE._col8 (type: decimal(38,2)), VALUE._col9 (type: decimal(38,2)), VALUE._col10 (type: decimal(38,2)), VALUE._col11 (type: decimal(38,2)), VALUE._col12 (type: decimal(38,2)), VALUE._col13 (type: decimal(38,2)), VALUE._col14 (type: decimal(38,2)), VALUE._col15 (type: decimal(38,2)), VALUE._col16 (type: decimal(38,2)), VALUE._col17 (type: decimal(38,12)), VALUE._col18 (type: decimal(38,12)), VALUE._col19 (type: decimal(38,12)), VALUE._col20 (type: decimal(38,12)), VALUE._col21 (type: decimal(38,12)), VALUE._col22 (type: decimal(38,12)), VALUE._col23 (type: decimal(38,12)), VALUE._col24 (type: decimal(38,12)), VALUE._col25 (type: decimal(38,12)), VALUE._col26 (type: decimal(38,12)), VALUE._col27 (type: decimal(38,12)), VALUE._col28 (type: decimal(38,12)), VALUE._col29 (type: decimal(38,2)), VALUE._col30 (type: decimal(38,2)), VALUE._col31 (type: decimal(38,2)), VALUE._col32 (type: decimal(38,2)), VALUE._col33 (type: decimal(38,2)), VALUE._col34 (type: decimal(38,2)), VALUE._col35 (type: decimal(38,2)), VALUE._col36 (type: decimal(38,2)), VALUE._col37 (type: decimal(38,2)), VALUE._col38 (type: decimal(38,2)), VALUE._col39 (type: decimal(38,2)), VALUE._col40 (type: decimal(38,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20, _col21, _col22, _col23, _col24, _col25, _col26, _col27, _col28, _col29, _col30, _col31, _col32, _col33, _col34, _col35, _col36, _col37, _col38, _col39, _col40, _col41 - Statistics: Num rows: 2122848 Data size: 9574044480 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2044224 Data size: 9219450240 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 451000 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query67.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query67.q.out index 4d0da1c88eb5..62d28f8d42d8 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query67.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query67.q.out @@ -57,7 +57,7 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6, _col7, _col9, _col11, _col12, _col13, _col14 input vertices: 1 Map 8 - Statistics: Num rows: 15840066266 Data size: 9709960621058 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15840066266 Data size: 9709960177866 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col14 (type: char(50)) null sort order: z @@ -126,17 +126,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 183414000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 182970808 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand (type: char(50)), i_class (type: char(50)), i_category (type: char(50)), i_product_name (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 462000 Data size: 183414000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 182970808 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 183414000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 182970808 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -150,16 +150,16 @@ STAGE PLANS: aggregations: sum(_col3) keys: _col5 (type: int), _col6 (type: int), _col7 (type: int), _col9 (type: string), _col11 (type: char(50)), _col12 (type: char(50)), _col13 (type: char(50)), _col14 (type: char(50)), 0L (type: bigint) grouping sets: 0, 16, 80, 112, 240, 241, 249, 253, 255 - minReductionHashAggr: 0.9867937 + minReductionHashAggr: 0.9867976 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 142560596394 Data size: 88530130360674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 88530126368834 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string), _col4 (type: char(50)), _col5 (type: char(50)), _col6 (type: char(50)), _col7 (type: char(50)), _col8 (type: bigint) null sort order: zzzzzzzzz sort order: +++++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string), _col4 (type: char(50)), _col5 (type: char(50)), _col6 (type: char(50)), _col7 (type: char(50)), _col8 (type: bigint) - Statistics: Num rows: 142560596394 Data size: 88530130360674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 88530126368834 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col9 (type: decimal(28,2)) Reducer 3 Execution mode: vectorized, llap @@ -169,25 +169,25 @@ STAGE PLANS: keys: KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: string), KEY._col4 (type: char(50)), KEY._col5 (type: char(50)), KEY._col6 (type: char(50)), KEY._col7 (type: char(50)), KEY._col8 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col9 - Statistics: Num rows: 142560596394 Data size: 88530130360674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 88530126368834 Basic stats: COMPLETE Column stats: COMPLETE pruneGroupingSetId: true Top N Key Operator sort order: +- keys: _col6 (type: char(50)), _col9 (type: decimal(28,2)) null sort order: aa Map-reduce partition columns: _col6 (type: char(50)) - Statistics: Num rows: 142560596394 Data size: 88530130360674 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 88530126368834 Basic stats: COMPLETE Column stats: COMPLETE top n: 101 Select Operator expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string), _col4 (type: char(50)), _col5 (type: char(50)), _col6 (type: char(50)), _col7 (type: char(50)), _col9 (type: decimal(28,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 142560596394 Data size: 87389645589522 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 87389637605453 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col6 (type: char(50)), _col8 (type: decimal(28,2)) null sort order: aa sort order: +- Map-reduce partition columns: _col6 (type: char(50)) - Statistics: Num rows: 142560596394 Data size: 87389645589522 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 87389637605453 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: string), _col4 (type: char(50)), _col5 (type: char(50)), _col7 (type: char(50)) Reducer 4 Execution mode: vectorized, llap @@ -195,7 +195,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: int), VALUE._col1 (type: int), VALUE._col2 (type: int), VALUE._col3 (type: string), VALUE._col4 (type: char(50)), VALUE._col5 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col6 (type: char(50)), KEY.reducesinkkey1 (type: decimal(28,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 142560596394 Data size: 87389645589522 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 87389637605453 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -216,32 +216,32 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 142560596394 Data size: 87389645589522 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 142560596394 Data size: 87389637605453 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (rank_window_0 <= 100) (type: boolean) - Statistics: Num rows: 47520198798 Data size: 29129881863174 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47520198798 Data size: 29129876540591 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++++++++++ keys: _col6 (type: char(50)), _col5 (type: char(50)), _col4 (type: char(50)), _col7 (type: char(50)), _col0 (type: int), _col2 (type: int), _col1 (type: int), _col3 (type: string), _col8 (type: decimal(28,2)), rank_window_0 (type: int) null sort order: zzzzzzzzzz - Statistics: Num rows: 47520198798 Data size: 29129881863174 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47520198798 Data size: 29129876540591 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col6 (type: char(50)), _col5 (type: char(50)), _col4 (type: char(50)), _col7 (type: char(50)), _col0 (type: int), _col2 (type: int), _col1 (type: int), _col3 (type: string), _col8 (type: decimal(28,2)), rank_window_0 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 47520198798 Data size: 29319962658366 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47520198798 Data size: 29319952012811 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)), _col4 (type: int), _col5 (type: int), _col6 (type: int), _col7 (type: string), _col8 (type: decimal(28,2)), _col9 (type: int) null sort order: zzzzzzzzzz sort order: ++++++++++ - Statistics: Num rows: 47520198798 Data size: 29319962658366 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47520198798 Data size: 29319952012811 Basic stats: COMPLETE Column stats: COMPLETE Reducer 5 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey1 (type: char(50)), KEY.reducesinkkey2 (type: char(50)), KEY.reducesinkkey3 (type: char(50)), KEY.reducesinkkey4 (type: int), KEY.reducesinkkey5 (type: int), KEY.reducesinkkey6 (type: int), KEY.reducesinkkey7 (type: string), KEY.reducesinkkey8 (type: decimal(28,2)), KEY.reducesinkkey9 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9 - Statistics: Num rows: 47520198798 Data size: 29319962658366 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 47520198798 Data size: 29319952012811 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 61700 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query68.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query68.q.out index 30c393c008f2..bec595585d4c 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query68.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query68.q.out @@ -19,20 +19,20 @@ STAGE PLANS: TableScan alias: customer filterExpr: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_current_addr_sk (type: bigint), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15680000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 15176269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: char(20)), _col3 (type: char(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -61,24 +61,24 @@ STAGE PLANS: Map Operator Tree: TableScan alias: current_addr - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_city (type: varchar(60)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(60)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(60)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -177,7 +177,7 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_city) IN ('Cedar Grove', 'Wildwood') (type: boolean) - Statistics: Num rows: 1704 Data size: 172104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 171081 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_city) IN ('Cedar Grove', 'Wildwood') (type: boolean) Statistics: Num rows: 13 Data size: 1313 Basic stats: COMPLETE Column stats: COMPLETE @@ -205,7 +205,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col5 input vertices: 1 Map 4 - Statistics: Num rows: 80000000 Data size: 22480000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 21864689839 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator condition map: @@ -216,25 +216,25 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col5, _col6, _col8, _col9, _col10, _col11 input vertices: 1 Reducer 7 - Statistics: Num rows: 5939893 Data size: 4217324030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 3490434608 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col5 <> _col8) (type: boolean) - Statistics: Num rows: 5939893 Data size: 4217324030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 3490434608 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: _col3 (type: char(30)), _col6 (type: bigint) null sort order: zz - Statistics: Num rows: 5939893 Data size: 4217324030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 3490434608 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col3 (type: char(30)), _col2 (type: char(20)), _col5 (type: varchar(60)), _col8 (type: varchar(60)), _col6 (type: bigint), _col9 (type: decimal(17,2)), _col11 (type: decimal(17,2)), _col10 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 5939893 Data size: 4217324030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2763544820 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col4 (type: bigint) null sort order: zz sort order: ++ - Statistics: Num rows: 5939893 Data size: 4217324030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2763544820 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: varchar(60)), _col3 (type: varchar(60)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -242,13 +242,13 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(30)), VALUE._col0 (type: char(20)), VALUE._col1 (type: varchar(60)), VALUE._col2 (type: varchar(60)), KEY.reducesinkkey1 (type: bigint), VALUE._col3 (type: decimal(17,2)), VALUE._col4 (type: decimal(17,2)), VALUE._col5 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 5939893 Data size: 4217324030 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2763544820 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 - Statistics: Num rows: 100 Data size: 71000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 47006 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 100 Data size: 71000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 100 Data size: 47006 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -265,7 +265,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col4, _col5, _col6, _col7, _col13 input vertices: 1 Map 4 - Statistics: Num rows: 5939893 Data size: 599929545 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 488350284 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col5), sum(_col6), sum(_col7) @@ -273,13 +273,13 @@ STAGE PLANS: minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 5939893 Data size: 2595733257 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2484153996 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: varchar(60)), _col2 (type: bigint), _col3 (type: bigint) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: varchar(60)), _col2 (type: bigint), _col3 (type: bigint) - Statistics: Num rows: 5939893 Data size: 2595733257 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2484153996 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) Reducer 7 Execution mode: vectorized, llap @@ -289,17 +289,17 @@ STAGE PLANS: keys: KEY._col0 (type: bigint), KEY._col1 (type: varchar(60)), KEY._col2 (type: bigint), KEY._col3 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 5939893 Data size: 2595733257 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2484153996 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: bigint), _col0 (type: bigint), _col1 (type: varchar(60)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5939893 Data size: 2595733249 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2484153988 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 5939893 Data size: 2595733249 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5939893 Data size: 2484153988 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: varchar(60)), _col3 (type: decimal(17,2)), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) Stage: Stage-0 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query69.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query69.q.out index 7703593c815e..488a2dcc9378 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query69.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query69.q.out @@ -26,7 +26,7 @@ STAGE PLANS: TableScan alias: c filterExpr: (c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_157_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.054623625 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_157_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.055674075 Statistics: Num rows: 80000000 Data size: 1897611080 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) @@ -44,20 +44,20 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 10 - Statistics: Num rows: 4369890 Data size: 48312544 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4453926 Data size: 49657120 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4369890 Data size: 48312544 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4453926 Data size: 49657120 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 4369890 Data size: 34959120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4453926 Data size: 35631408 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=4369890) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=4453926) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 @@ -74,20 +74,20 @@ STAGE PLANS: TableScan alias: ca filterExpr: (ca_state) IN ('CO', 'IL', 'MN') (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_state) IN ('CO', 'IL', 'MN') (type: boolean) - Statistics: Num rows: 2264151 Data size: 212830194 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2307692 Data size: 210970472 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 2264151 Data size: 18113208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2307692 Data size: 18461536 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 2264151 Data size: 18113208 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2307692 Data size: 18461536 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 11 @@ -311,19 +311,19 @@ STAGE PLANS: outputColumnNames: _col0, _col1 input vertices: 1 Map 11 - Statistics: Num rows: 15228208 Data size: 222045632 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15521056 Data size: 226731200 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 15228208 Data size: 222045632 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15521056 Data size: 226731200 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 15228208 Data size: 121825664 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15521056 Data size: 124168448 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=3956347) minReductionHashAggr: 0.99 @@ -492,7 +492,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=4369890) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=4453926) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query7.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query7.q.out index 1b813b0fe846..e25b2e1ae19c 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query7.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query7.q.out @@ -17,7 +17,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: (ss_cdemo_sk is not null and ss_promo_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_94_container, bigKeyColName:ss_cdemo_sk, smallTablePos:1, keyRatio:1.6082727526128025E-8 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_100_container, bigKeyColName:ss_cdemo_sk, smallTablePos:1, keyRatio:1.6082727526128025E-8 Statistics: Num rows: 82510879939 Data size: 30001935686500 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ss_cdemo_sk is not null and ss_promo_sk is not null) (type: boolean) @@ -30,27 +30,27 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col7 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 + outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6, _col7 input vertices: 1 Map 4 - Statistics: Num rows: 15811383493 Data size: 5095447574104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 78670256451 Data size: 27990870156136 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: bigint) + 0 _col7 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6 + outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6 input vertices: 1 Map 5 - Statistics: Num rows: 225876909 Data size: 1807015620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15811383493 Data size: 4983749331480 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col1 (type: bigint) 1 _col0 (type: bigint) outputColumnNames: _col0, _col3, _col4, _col5, _col6 input vertices: @@ -89,6 +89,27 @@ STAGE PLANS: Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 4 + Map Operator Tree: + TableScan + alias: promotion + filterExpr: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) + Statistics: Num rows: 2300 Data size: 405235 Basic stats: COMPLETE Column stats: COMPLETE + Filter Operator + predicate: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) + Statistics: Num rows: 2300 Data size: 405235 Basic stats: COMPLETE Column stats: COMPLETE + Select Operator + expressions: p_promo_sk (type: bigint) + outputColumnNames: _col0 + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE + Reduce Output Operator + key expressions: _col0 (type: bigint) + null sort order: z + sort order: + + Map-reduce partition columns: _col0 (type: bigint) + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE + Execution mode: vectorized, llap + LLAP IO: may be used (ACID table) + Map 5 Map Operator Tree: TableScan alias: date_dim @@ -125,7 +146,7 @@ STAGE PLANS: Target Vertex: Map 1 Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 5 + Map 6 Map Operator Tree: TableScan alias: customer_demographics @@ -146,27 +167,6 @@ STAGE PLANS: Statistics: Num rows: 27440 Data size: 219520 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 6 - Map Operator Tree: - TableScan - alias: promotion - filterExpr: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) - Statistics: Num rows: 2300 Data size: 409400 Basic stats: COMPLETE Column stats: COMPLETE - Filter Operator - predicate: ((p_channel_email = 'N') or (p_channel_event = 'N')) (type: boolean) - Statistics: Num rows: 2300 Data size: 409400 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: p_promo_sk (type: bigint) - outputColumnNames: _col0 - Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - key expressions: _col0 (type: bigint) - null sort order: z - sort order: + - Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE - Execution mode: vectorized, llap - LLAP IO: may be used (ACID table) Map 7 Map Operator Tree: TableScan diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query70.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query70.q.out index f417133c1fa9..f87d83a96d00 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query70.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query70.q.out @@ -21,7 +21,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_store_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_120_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:0.1919754858718087 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_120_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:0.19084767828972019 Statistics: Num rows: 82510879939 Data size: 10327900046896 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_store_sk is not null (type: boolean) @@ -49,7 +49,7 @@ STAGE PLANS: outputColumnNames: _col1, _col6, _col7 input vertices: 1 Map 6 - Statistics: Num rows: 15840066266 Data size: 4475829148384 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15747009870 Data size: 4448284453144 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Left Semi Join 0 to 1 @@ -59,11 +59,11 @@ STAGE PLANS: outputColumnNames: _col1, _col6, _col7 input vertices: 1 Reducer 9 - Statistics: Num rows: 5040021084 Data size: 1279015774512 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5126933446 Data size: 1304741831640 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col7 (type: char(2)), _col6 (type: varchar(30)), _col1 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 5040021084 Data size: 1279015774512 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5126933446 Data size: 1304741831640 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col0 (type: char(2)), _col1 (type: varchar(30)), 0L (type: bigint) @@ -71,13 +71,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3073155 Data size: 934239120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3945078 Data size: 1199303712 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)), _col1 (type: varchar(30)), _col2 (type: bigint) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(2)), _col1 (type: varchar(30)), _col2 (type: bigint) - Statistics: Num rows: 3073155 Data size: 934239120 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3945078 Data size: 1199303712 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -145,31 +145,31 @@ STAGE PLANS: TableScan alias: store filterExpr: s_state is not null (type: boolean) - Statistics: Num rows: 1704 Data size: 327168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 325144 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: s_state is not null (type: boolean) - Statistics: Num rows: 1704 Data size: 327168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 322840 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_county (type: varchar(30)), s_state (type: char(2)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 327168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 322840 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 327168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 322840 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(30)), _col2 (type: char(2)) Select Operator expressions: s_store_sk (type: bigint), s_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 158102 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 160176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 158102 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -178,7 +178,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_store_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_122_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:0.1919754858718087 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_122_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:0.19084767828972019 Statistics: Num rows: 82510879939 Data size: 10327900046896 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_store_sk is not null (type: boolean) @@ -206,20 +206,20 @@ STAGE PLANS: outputColumnNames: _col1, _col5 input vertices: 1 Map 6 - Statistics: Num rows: 15840066266 Data size: 2923502654316 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15747009870 Data size: 2905077486962 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col5 (type: char(2)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 502480 Data size: 99491040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 499312 Data size: 98863776 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(2)) - Statistics: Num rows: 502480 Data size: 99491040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 499312 Data size: 98863776 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -231,17 +231,17 @@ STAGE PLANS: keys: KEY._col0 (type: char(2)), KEY._col1 (type: varchar(30)), KEY._col2 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 615 Data size: 186960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 191520 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(2)), _col1 (type: varchar(30)), _col3 (type: decimal(17,2)), _col2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 615 Data size: 186960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 191520 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), CASE WHEN ((grouping(_col3, 0L) = UDFToLong(0))) THEN (_col0) ELSE (CAST( null AS CHAR(2))) END (type: char(2)), _col2 (type: decimal(17,2)) null sort order: aaa sort order: ++- Map-reduce partition columns: (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), CASE WHEN ((grouping(_col3, 0L) = UDFToLong(0))) THEN (_col0) ELSE (CAST( null AS CHAR(2))) END (type: char(2)) - Statistics: Num rows: 615 Data size: 186960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 191520 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(2)), _col1 (type: varchar(30)), _col3 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -249,7 +249,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(2)), VALUE._col1 (type: varchar(30)), KEY.reducesinkkey2 (type: decimal(17,2)), VALUE._col2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 615 Data size: 186960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 191520 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -270,22 +270,22 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 615 Data size: 186960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 191520 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: -++ keys: (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), if(((grouping(_col3, 1L) + grouping(_col3, 0L)) = 0L), _col0, null) (type: char(2)), rank_window_0 (type: int) null sort order: azz - Statistics: Num rows: 615 Data size: 186960 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 191520 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: decimal(17,2)), _col0 (type: char(2)), _col1 (type: varchar(30)), (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), rank_window_0 (type: int), if(((grouping(_col3, 1L) + grouping(_col3, 0L)) = 0L), _col0, null) (type: char(2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 615 Data size: 189506 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 194126 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: bigint), _col5 (type: char(2)), _col4 (type: int) null sort order: azz sort order: -++ - Statistics: Num rows: 615 Data size: 189506 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 194126 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: decimal(17,2)), _col1 (type: char(2)), _col2 (type: varchar(30)) Reducer 4 Execution mode: vectorized, llap @@ -293,7 +293,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: decimal(17,2)), VALUE._col1 (type: char(2)), VALUE._col2 (type: varchar(30)), KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey2 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 615 Data size: 189420 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 630 Data size: 194040 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 30800 Basic stats: COMPLETE Column stats: COMPLETE @@ -312,27 +312,27 @@ STAGE PLANS: keys: KEY._col0 (type: char(2)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 44 Data size: 8712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 43 Data size: 8514 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +- keys: _col0 (type: char(2)), _col1 (type: decimal(17,2)) null sort order: aa Map-reduce partition columns: _col0 (type: char(2)) - Statistics: Num rows: 44 Data size: 8712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 43 Data size: 8514 Basic stats: COMPLETE Column stats: COMPLETE top n: 6 Reduce Output Operator key expressions: _col0 (type: char(2)), _col1 (type: decimal(17,2)) null sort order: aa sort order: +- Map-reduce partition columns: _col0 (type: char(2)) - Statistics: Num rows: 44 Data size: 8712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 43 Data size: 8514 Basic stats: COMPLETE Column stats: COMPLETE Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator expressions: KEY.reducesinkkey0 (type: char(2)), KEY.reducesinkkey1 (type: decimal(17,2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 44 Data size: 8712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 43 Data size: 8514 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -353,7 +353,7 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 44 Data size: 8712 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 43 Data size: 8514 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (rank_window_0 <= 5) (type: boolean) Statistics: Num rows: 14 Data size: 2772 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query71.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query71.q.out index b5c0f12a1272..16b39d57a5d9 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query71.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query71.q.out @@ -20,7 +20,7 @@ STAGE PLANS: TableScan alias: web_sales filterExpr: ws_sold_time_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_119_container, bigKeyColName:ws_sold_time_sk, smallTablePos:1, keyRatio:4.3992401279400425E-9 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_119_container, bigKeyColName:ws_sold_time_sk, smallTablePos:1, keyRatio:5.881089434193531E-9 Statistics: Num rows: 21594638446 Data size: 2936546600912 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ws_sold_time_sk is not null (type: boolean) @@ -52,7 +52,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col4, _col5 input vertices: 1 Map 8 - Statistics: Num rows: 23627911 Data size: 2457302824 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 23627911 Data size: 2457301824 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -62,20 +62,20 @@ STAGE PLANS: outputColumnNames: _col0, _col4, _col5, _col7, _col8 input vertices: 1 Map 10 - Statistics: Num rows: 11813956 Data size: 1323163144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 1764216576 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0) keys: _col4 (type: int), _col5 (type: char(50)), _col7 (type: int), _col8 (type: int) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -84,34 +84,34 @@ STAGE PLANS: TableScan alias: time_dim filterExpr: (t_meal_time) IN ('breakfast ', 'dinner ') (type: boolean) - Statistics: Num rows: 86400 Data size: 8899200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 86400 Data size: 4514487 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (t_meal_time) IN ('breakfast ', 'dinner ') (type: boolean) - Statistics: Num rows: 43200 Data size: 4449600 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57600 Data size: 3009687 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: t_time_sk (type: bigint), t_hour (type: int), t_minute (type: int) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 43200 Data size: 691200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57600 Data size: 921600 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 43200 Data size: 691200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57600 Data size: 921600 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 43200 Data size: 691200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57600 Data size: 921600 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 43200 Data size: 691200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 57600 Data size: 921600 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -151,7 +151,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col4, _col5 input vertices: 1 Map 8 - Statistics: Num rows: 23627911 Data size: 2457302824 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 23627911 Data size: 2457301824 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -161,20 +161,20 @@ STAGE PLANS: outputColumnNames: _col0, _col4, _col5, _col7, _col8 input vertices: 1 Map 10 - Statistics: Num rows: 11813956 Data size: 1323163144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 1764216576 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0) keys: _col4 (type: int), _col5 (type: char(50)), _col7 (type: int), _col8 (type: int) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -295,7 +295,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col4, _col5 input vertices: 1 Map 8 - Statistics: Num rows: 23627911 Data size: 2457302824 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 23627911 Data size: 2457301824 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -305,20 +305,20 @@ STAGE PLANS: outputColumnNames: _col0, _col4, _col5, _col7, _col8 input vertices: 1 Map 10 - Statistics: Num rows: 11813956 Data size: 1323163144 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 1764216576 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col0) keys: _col4 (type: int), _col5 (type: char(50)), _col7 (type: int), _col8 (type: int) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -327,20 +327,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_manager_id = 1) (type: boolean) - Statistics: Num rows: 462000 Data size: 53582956 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 53467656 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_manager_id = 1) (type: boolean) - Statistics: Num rows: 4442 Data size: 515192 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 514192 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand_id (type: int), i_brand (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)) Select Operator expressions: _col0 (type: bigint) @@ -362,14 +362,14 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 4442 Data size: 497464 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4442 Data size: 496464 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -381,16 +381,16 @@ STAGE PLANS: keys: KEY._col0 (type: int), KEY._col1 (type: char(50)), KEY._col2 (type: int), KEY._col3 (type: int) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(50)), _col2 (type: int), _col3 (type: int), _col4 (type: decimal(17,2)), _col0 (type: int) outputColumnNames: _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: decimal(17,2)), _col5 (type: int) null sort order: az sort order: -+ - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: int), _col3 (type: int) Reducer 4 Execution mode: vectorized, llap @@ -398,10 +398,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: int), VALUE._col0 (type: char(50)), VALUE._col1 (type: int), VALUE._col2 (type: int), KEY.reducesinkkey0 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 11813956 Data size: 2646326104 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15751942 Data size: 3528433968 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query72.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query72.q.out index 362a76884717..ba4d9ea3c1ea 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query72.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query72.q.out @@ -235,17 +235,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 88704000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 88491112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_desc (type: varchar(200)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 462000 Data size: 88704000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 88491112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 88704000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 88491112 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(200)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -450,24 +450,24 @@ STAGE PLANS: outputColumnNames: _col15, _col21, _col25, _col27 input vertices: 1 Map 17 - Statistics: Num rows: 273405096989 Data size: 80927908708744 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 273405096989 Data size: 80927908495856 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col27 (type: varchar(200)), _col25 (type: varchar(20)), _col15 (type: int), if(_col21 is null, 1, 0) (type: int), if(_col21 is not null, 1, 0) (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 273405096989 Data size: 80927908708744 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 273405096989 Data size: 80927908495856 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col3), count(_col4), count() keys: _col0 (type: varchar(200)), _col1 (type: varchar(20)), _col2 (type: int) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 273405096989 Data size: 85302390260568 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 273405096989 Data size: 85302390047680 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: varchar(200)), _col1 (type: varchar(20)), _col2 (type: int) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: varchar(200)), _col1 (type: varchar(20)), _col2 (type: int) - Statistics: Num rows: 273405096989 Data size: 85302390260568 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 273405096989 Data size: 85302390047680 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint) Reducer 4 Execution mode: vectorized, llap @@ -477,18 +477,18 @@ STAGE PLANS: keys: KEY._col0 (type: varchar(200)), KEY._col1 (type: varchar(20)), KEY._col2 (type: int) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 3387352014 Data size: 1056853828368 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3387361923 Data size: 1056856917584 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: -+++ keys: _col5 (type: bigint), _col0 (type: varchar(200)), _col1 (type: varchar(20)), _col2 (type: int) null sort order: azzz - Statistics: Num rows: 3387352014 Data size: 1056853828368 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3387361923 Data size: 1056856917584 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Reduce Output Operator key expressions: _col5 (type: bigint), _col0 (type: varchar(200)), _col1 (type: varchar(20)), _col2 (type: int) null sort order: azzz sort order: -+++ - Statistics: Num rows: 3387352014 Data size: 1056853828368 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3387361923 Data size: 1056856917584 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -496,7 +496,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: varchar(200)), KEY.reducesinkkey2 (type: varchar(20)), KEY.reducesinkkey3 (type: int), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 3387352014 Data size: 1056853828368 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3387361923 Data size: 1056856915008 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 31200 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query73.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query73.q.out index bd1b3a77a5ef..a347e2e2920c 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query73.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query73.q.out @@ -18,11 +18,11 @@ STAGE PLANS: TableScan alias: customer probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_92_container, bigKeyColName:c_customer_sk, smallTablePos:1, keyRatio:1.25E-8 - Statistics: Num rows: 80000000 Data size: 28800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 27814510494 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_salutation (type: char(10)), c_first_name (type: char(20)), c_last_name (type: char(30)), c_preferred_cust_flag (type: char(1)) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 80000000 Data size: 28800000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 27814510494 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -32,16 +32,16 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col4, _col5, _col7 input vertices: 1 Reducer 4 - Statistics: Num rows: 5 Data size: 1840 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: char(30)), _col2 (type: char(20)), _col1 (type: char(10)), _col4 (type: char(1)), _col5 (type: bigint), _col7 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5 Data size: 1840 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col5 (type: bigint) null sort order: a sort order: - - Statistics: Num rows: 5 Data size: 1840 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: char(10)), _col3 (type: char(1)), _col4 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -50,7 +50,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: (ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_91_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:1.5365246388564515E-7 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_91_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:1.5654905158628162E-7 Statistics: Num rows: 82510879939 Data size: 3253774532920 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ss_hdemo_sk is not null and ss_customer_sk is not null and ss_store_sk is not null) (type: boolean) @@ -88,20 +88,20 @@ STAGE PLANS: outputColumnNames: _col0, _col3 input vertices: 1 Map 7 - Statistics: Num rows: 12400839 Data size: 99206720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12634816 Data size: 101078536 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: bigint), _col3 (type: bigint) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 12400839 Data size: 198413432 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12634816 Data size: 202157064 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 12400839 Data size: 198413432 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12634816 Data size: 202157064 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -168,20 +168,20 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_county) IN ('Huron County', 'Kittitas County', 'Maverick County', 'Mobile County') (type: boolean) - Statistics: Num rows: 1704 Data size: 180624 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 179546 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_county) IN ('Huron County', 'Kittitas County', 'Maverick County', 'Mobile County') (type: boolean) - Statistics: Num rows: 53 Data size: 5618 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 54 Data size: 5724 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 53 Data size: 424 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 54 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 53 Data size: 424 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 54 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 2 @@ -190,10 +190,10 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(30)), VALUE._col1 (type: char(20)), VALUE._col2 (type: char(10)), VALUE._col3 (type: char(1)), VALUE._col4 (type: bigint), KEY.reducesinkkey0 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5 Data size: 1840 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 5 Data size: 1840 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5 Data size: 432 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat @@ -206,11 +206,11 @@ STAGE PLANS: keys: KEY._col0 (type: bigint), KEY._col1 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 12400839 Data size: 198413432 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12634816 Data size: 202157064 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: bigint), _col0 (type: bigint), _col2 (type: bigint) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 12400839 Data size: 198413432 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 12634816 Data size: 202157064 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 BETWEEN 1L AND 5L (type: boolean) Statistics: Num rows: 5 Data size: 88 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query74.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query74.q.out index bf65d327cbdf..a4d4d3fc6f27 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query74.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query74.q.out @@ -229,7 +229,7 @@ STAGE PLANS: alias: customer Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator @@ -238,32 +238,32 @@ STAGE PLANS: sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) Statistics: Num rows: 80000000 Data size: 8640000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)) + value expressions: _col1 (type: string) Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)), c_first_name (type: char(20)), c_last_name (type: char(30)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 23040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 22536269100 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 23040000000 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)), _col2 (type: char(20)), _col3 (type: char(30)) + Statistics: Num rows: 80000000 Data size: 22536269100 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string), _col2 (type: char(20)), _col3 (type: char(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 11 @@ -282,16 +282,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col1) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.9815652 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 12 @@ -299,15 +299,15 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 13 @@ -326,16 +326,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col1) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.9815652 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 14 @@ -343,7 +343,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -351,14 +351,14 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(17,2)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(17,2)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 80000000 Data size: 17280000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 17280000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: boolean) Reducer 16 @@ -397,37 +397,37 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col6, _col7 input vertices: 1 Map 18 - Statistics: Num rows: 16192399916 Data size: 6135275611584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 16192399916 Data size: 6134771880684 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col1) - keys: _col5 (type: char(16)), _col6 (type: char(20)), _col7 (type: char(30)) + keys: _col5 (type: string), _col6 (type: char(20)), _col7 (type: char(30)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 31360000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 31357511410 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: char(20)), _col2 (type: char(30)) + key expressions: _col0 (type: string), _col1 (type: char(20)), _col2 (type: char(30)) null sort order: zzz sort order: +++ - Map-reduce partition columns: _col0 (type: char(16)), _col1 (type: char(20)), _col2 (type: char(30)) - Statistics: Num rows: 80000000 Data size: 31360000000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: string), _col1 (type: char(20)), _col2 (type: char(30)) + Statistics: Num rows: 80000000 Data size: 31357511410 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)), KEY._col1 (type: char(20)), KEY._col2 (type: char(30)) + keys: KEY._col0 (type: string), KEY._col1 (type: char(20)), KEY._col2 (type: char(30)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 80000000 Data size: 31360000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 31357511410 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) - Statistics: Num rows: 80000000 Data size: 31360000000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 80000000 Data size: 31357511410 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -445,16 +445,16 @@ STAGE PLANS: DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col1) - keys: _col5 (type: char(16)) + keys: _col5 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)) Reducer 5 @@ -462,7 +462,7 @@ STAGE PLANS: Reduce Operator Tree: Group By Operator aggregations: sum(VALUE._col0) - keys: KEY._col0 (type: char(16)) + keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE @@ -470,14 +470,14 @@ STAGE PLANS: predicate: (_col1 > 0) (type: boolean) Statistics: Num rows: 80000000 Data size: 16960000000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: decimal(17,2)), (_col1 > 0) (type: boolean) + expressions: _col0 (type: string), _col1 (type: decimal(17,2)), (_col1 > 0) (type: boolean) outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 80000000 Data size: 17280000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) + Map-reduce partition columns: _col0 (type: string) Statistics: Num rows: 80000000 Data size: 17280000000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: boolean) Reducer 6 @@ -487,19 +487,19 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col5, _col6 input vertices: 0 Reducer 3 - Statistics: Num rows: 80000000 Data size: 40640000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 40637511410 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) - Statistics: Num rows: 80000000 Data size: 40640000000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 80000000 Data size: 40637511410 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: boolean) Reducer 7 Execution mode: vectorized, llap @@ -508,19 +508,19 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col5, _col6, _col8 input vertices: 1 Reducer 12 - Statistics: Num rows: 80000000 Data size: 49600000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 49597511410 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator - key expressions: _col0 (type: char(16)) + key expressions: _col0 (type: string) null sort order: z sort order: + - Map-reduce partition columns: _col0 (type: char(16)) - Statistics: Num rows: 80000000 Data size: 49600000000 Basic stats: COMPLETE Column stats: COMPLETE + Map-reduce partition columns: _col0 (type: string) + Statistics: Num rows: 80000000 Data size: 49597511410 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)), _col3 (type: decimal(17,2)), _col5 (type: decimal(17,2)), _col6 (type: boolean), _col8 (type: decimal(17,2)) Reducer 8 Execution mode: vectorized, llap @@ -529,38 +529,38 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 KEY.reducesinkkey0 (type: char(16)) - 1 KEY.reducesinkkey0 (type: char(16)) + 0 KEY.reducesinkkey0 (type: string) + 1 KEY.reducesinkkey0 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col5, _col6, _col8, _col10, _col11 input vertices: 1 Reducer 14 - Statistics: Num rows: 80000000 Data size: 58880000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 58877511410 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Filter Operator predicate: if(_col6, if(_col11, ((_col8 / _col10) > (_col3 / _col5)), false), false) (type: boolean) - Statistics: Num rows: 40000000 Data size: 29440000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 29438755750 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++ - keys: _col2 (type: char(30)), _col0 (type: char(16)), _col1 (type: char(20)) + keys: _col2 (type: char(30)), _col0 (type: string), _col1 (type: char(20)) null sort order: zzz - Statistics: Num rows: 40000000 Data size: 29440000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 29438755750 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator - expressions: _col0 (type: char(16)), _col1 (type: char(20)), _col2 (type: char(30)) + expressions: _col0 (type: string), _col1 (type: char(20)), _col2 (type: char(30)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40000000 Data size: 11200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 11197511320 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col2 (type: char(30)), _col0 (type: char(16)), _col1 (type: char(20)) + key expressions: _col2 (type: char(30)), _col0 (type: string), _col1 (type: char(20)) null sort order: zzz sort order: +++ - Statistics: Num rows: 40000000 Data size: 11200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 11197511320 Basic stats: COMPLETE Column stats: COMPLETE Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey1 (type: char(16)), KEY.reducesinkkey2 (type: char(20)), KEY.reducesinkkey0 (type: char(30)) + expressions: KEY.reducesinkkey1 (type: string), KEY.reducesinkkey2 (type: char(20)), KEY.reducesinkkey0 (type: char(30)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 40000000 Data size: 11200000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 11197511320 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 28000 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query75.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query75.q.out index d8a87abb66ef..fb410a0a6414 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query75.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query75.q.out @@ -42,55 +42,55 @@ STAGE PLANS: TableScan alias: item filterExpr: ((i_category = 'Sports ') and i_manufact_id is not null and i_category_id is not null and i_brand_id is not null and i_class_id is not null) (type: boolean) - Statistics: Num rows: 462000 Data size: 52649820 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 52549740 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((i_category = 'Sports ') and i_manufact_id is not null and i_category_id is not null and i_brand_id is not null and i_class_id is not null) (type: boolean) - Statistics: Num rows: 41585 Data size: 4739062 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 5203332 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand_id (type: int), i_class_id (type: int), i_category_id (type: int), i_manufact_id (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -272,18 +272,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Reducer 4 - Statistics: Num rows: 1492674976 Data size: 47765597720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1641996368 Data size: 52543882104 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 1492674976 Data size: 47765597720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1641996368 Data size: 52543882104 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: int), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int) Select Operator expressions: _col0 (type: bigint), _col1 (type: bigint), hash(_col0,_col1) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 1492674976 Data size: 29853499520 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1641996368 Data size: 32839927360 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -314,18 +314,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Map 1 - Statistics: Num rows: 1492674976 Data size: 47765597720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1641996368 Data size: 52543882104 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 1492674976 Data size: 47765597720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1641996368 Data size: 52543882104 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: int), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int) Select Operator expressions: _col0 (type: bigint), _col1 (type: bigint), hash(_col0,_col1) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 1492674976 Data size: 29853499520 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1641996368 Data size: 32839927360 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -367,18 +367,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Reducer 3 - Statistics: Num rows: 390660922 Data size: 57504437720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 429741120 Data size: 63288306864 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 390660922 Data size: 57504437720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 429741120 Data size: 63288306864 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: int), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int) Select Operator expressions: _col0 (type: bigint), _col1 (type: bigint), hash(_col0,_col1) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 390660922 Data size: 7813218440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 429741120 Data size: 8594822400 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -409,18 +409,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Map 1 - Statistics: Num rows: 390660922 Data size: 57504437720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 429741120 Data size: 63288306864 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 390660922 Data size: 57504437720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 429741120 Data size: 63288306864 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: int), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int) Select Operator expressions: _col0 (type: bigint), _col1 (type: bigint), hash(_col0,_col1) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 390660922 Data size: 7813218440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 429741120 Data size: 8594822400 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -534,18 +534,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Map 1 - Statistics: Num rows: 772490513 Data size: 101850760856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 849767456 Data size: 113287748260 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 772490513 Data size: 101850760856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 849767456 Data size: 113287748260 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: int), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int) Select Operator expressions: _col0 (type: bigint), _col1 (type: bigint), hash(_col0,_col1) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 772490513 Data size: 15449810260 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 849767456 Data size: 16995349120 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -576,18 +576,18 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col3, _col7, _col8, _col9, _col10 input vertices: 1 Reducer 2 - Statistics: Num rows: 772490513 Data size: 101850760856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 849767456 Data size: 113287748260 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint) - Statistics: Num rows: 772490513 Data size: 101850760856 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 849767456 Data size: 113287748260 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: int), _col3 (type: decimal(7,2)), _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int) Select Operator expressions: _col0 (type: bigint), _col1 (type: bigint), hash(_col0,_col1) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 772490513 Data size: 15449810260 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 849767456 Data size: 16995349120 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -626,24 +626,24 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col10, _col13, _col14 input vertices: 1 Map 21 - Statistics: Num rows: 2017213214 Data size: 388166715564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2219007370 Data size: 429247540704 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), (_col2 - if(_col13 is not null, _col13, 0)) (type: int), (_col3 - if(_col14 is not null, _col14, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 2017213214 Data size: 266272142620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2219007370 Data size: 292908971052 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reducer 13 Execution mode: vectorized, llap Reduce Operator Tree: @@ -651,7 +651,7 @@ STAGE PLANS: keys: KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: int), KEY._col4 (type: int), KEY._col5 (type: decimal(8,2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col4), sum(_col5) keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) @@ -767,7 +767,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reducer 20 Execution mode: vectorized, llap @@ -793,24 +793,24 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col10, _col13, _col14 input vertices: 1 Map 5 - Statistics: Num rows: 4012530964 Data size: 613800764264 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4413928937 Data size: 678704898464 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), (_col2 - if(_col13 is not null, _col13, 0)) (type: int), (_col3 - if(_col14 is not null, _col14, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 4012530964 Data size: 529654085620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4413928937 Data size: 582638617896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reducer 24 Execution mode: vectorized, llap Reduce Operator Tree: @@ -836,24 +836,24 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col10, _col13, _col14 input vertices: 1 Map 5 - Statistics: Num rows: 4012530964 Data size: 613800764264 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4413928937 Data size: 678704898464 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), (_col2 - if(_col13 is not null, _col13, 0)) (type: int), (_col3 - if(_col14 is not null, _col14, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 4012530964 Data size: 529654085620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4413928937 Data size: 582638617896 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reducer 26 Execution mode: vectorized, llap Reduce Operator Tree: @@ -879,24 +879,24 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col10, _col13, _col14 input vertices: 1 Map 32 - Statistics: Num rows: 1031325981 Data size: 198862953200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1134495818 Data size: 219915769648 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), (_col2 - if(_col13 is not null, _col13, 0)) (type: int), (_col3 - if(_col14 is not null, _col14, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 1031325981 Data size: 136135027864 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1134495818 Data size: 149753446188 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reducer 29 Execution mode: vectorized, llap Reduce Operator Tree: @@ -921,7 +921,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reducer 30 Execution mode: vectorized, llap @@ -935,24 +935,24 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col10, _col13, _col14 input vertices: 1 Map 32 - Statistics: Num rows: 1031325981 Data size: 198862953200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1134495818 Data size: 219915769648 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), (_col2 - if(_col13 is not null, _col13, 0)) (type: int), (_col3 - if(_col14 is not null, _col14, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 1031325981 Data size: 136135027864 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1134495818 Data size: 149753446188 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reducer 31 Execution mode: vectorized, llap Reduce Operator Tree: @@ -977,7 +977,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 41585 Data size: 996412 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 45745 Data size: 1096092 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int) Reducer 7 Execution mode: vectorized, llap @@ -991,24 +991,24 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col7, _col8, _col9, _col10, _col13, _col14 input vertices: 1 Map 21 - Statistics: Num rows: 2017213214 Data size: 388166715564 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2219007370 Data size: 429247540704 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col7 (type: int), _col8 (type: int), _col9 (type: int), _col10 (type: int), (_col2 - if(_col13 is not null, _col13, 0)) (type: int), (_col3 - if(_col14 is not null, _col14, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 2017213214 Data size: 266272142620 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2219007370 Data size: 292908971052 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int), _col4 (type: int), _col5 (type: decimal(8,2)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Reducer 9 Execution mode: vectorized, llap Reduce Operator Tree: @@ -1016,7 +1016,7 @@ STAGE PLANS: keys: KEY._col0 (type: int), KEY._col1 (type: int), KEY._col2 (type: int), KEY._col3 (type: int), KEY._col4 (type: int), KEY._col5 (type: decimal(8,2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 6029744178 Data size: 795926226580 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6632936307 Data size: 875547587128 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col4), sum(_col5) keys: _col0 (type: int), _col1 (type: int), _col2 (type: int), _col3 (type: int) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query76.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query76.q.out index 58b21d9f3ea4..69db3005efd5 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query76.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query76.q.out @@ -127,16 +127,16 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col4, _col7 input vertices: 1 Map 6 - Statistics: Num rows: 1946839900 Data size: 403692777096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1946839900 Data size: 403692677016 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: 'store' (type: string), 'ss_addr_sk' (type: string), _col1 (type: int), _col2 (type: int), _col7 (type: char(50)), _col4 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 1946839900 Data size: 759964478796 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1946839900 Data size: 759964378716 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++ keys: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) null sort order: zzzzz - Statistics: Num rows: 2057228617 Data size: 804076268851 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2057228617 Data size: 804075968611 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: count(), sum(_col5) @@ -144,13 +144,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 27502596 Data size: 11221059168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 27502596 Data size: 11221048548 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) - Statistics: Num rows: 27502596 Data size: 11221059168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 27502596 Data size: 11221048548 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: bigint), _col6 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -158,31 +158,31 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 45276000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 45175920 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_category (type: char(50)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 462000 Data size: 45276000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 45175920 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 45276000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 45175920 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 45276000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 45175920 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 45276000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 45175920 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -219,16 +219,16 @@ STAGE PLANS: outputColumnNames: _col1, _col4, _col5, _col7 input vertices: 1 Map 6 - Statistics: Num rows: 2698517 Data size: 566650826 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2698517 Data size: 566550746 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: 'web' (type: string), 'ws_web_page_sk' (type: string), _col4 (type: int), _col5 (type: int), _col7 (type: char(50)), _col1 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 2698517 Data size: 1065876471 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2698517 Data size: 1065776391 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++ keys: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) null sort order: zzzzz - Statistics: Num rows: 2057228617 Data size: 804076268851 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2057228617 Data size: 804075968611 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: count(), sum(_col5) @@ -236,13 +236,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 27502596 Data size: 11221059168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 27502596 Data size: 11221048548 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) - Statistics: Num rows: 27502596 Data size: 11221059168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 27502596 Data size: 11221048548 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: bigint), _col6 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -279,16 +279,16 @@ STAGE PLANS: outputColumnNames: _col1, _col4, _col5, _col7 input vertices: 1 Map 6 - Statistics: Num rows: 107690200 Data size: 22584775584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 107690200 Data size: 22584675504 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: 'catalog' (type: string), 'cs_warehouse_sk' (type: string), _col4 (type: int), _col5 (type: int), _col7 (type: char(50)), _col1 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 107690200 Data size: 43045913584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 107690200 Data size: 43045813504 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++ keys: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) null sort order: zzzzz - Statistics: Num rows: 2057228617 Data size: 804076268851 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2057228617 Data size: 804075968611 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator aggregations: count(), sum(_col5) @@ -296,13 +296,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 27502596 Data size: 11221059168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 27502596 Data size: 11221048548 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: string), _col1 (type: string), _col2 (type: int), _col3 (type: int), _col4 (type: char(50)) - Statistics: Num rows: 27502596 Data size: 11221059168 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 27502596 Data size: 11221048548 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: bigint), _col6 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query79.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query79.q.out index 3ae0064cc2de..3da84acf50dd 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query79.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query79.q.out @@ -17,17 +17,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -64,7 +64,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col2, _col4, _col5, _col6, _col10 input vertices: 1 Map 7 - Statistics: Num rows: 6348351959 Data size: 1766432268779 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6348351959 Data size: 1766432267756 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -74,20 +74,20 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col4, _col5, _col6, _col10 input vertices: 1 Map 8 - Statistics: Num rows: 5713516612 Data size: 1513660477204 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 1513660476181 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col5), sum(_col6) keys: _col0 (type: bigint), _col2 (type: bigint), _col4 (type: bigint), _col10 (type: varchar(60)) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5713516612 Data size: 1919324915684 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 1919324914661 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: varchar(60)) null sort order: zzzz sort order: ++++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: bigint), _col3 (type: varchar(60)) - Statistics: Num rows: 5713516612 Data size: 1919324915684 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 1919324914661 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -133,20 +133,20 @@ STAGE PLANS: TableScan alias: store filterExpr: s_number_employees BETWEEN 200 AND 295 (type: boolean) - Statistics: Num rows: 1704 Data size: 178872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 177849 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: s_number_employees BETWEEN 200 AND 295 (type: boolean) - Statistics: Num rows: 1636 Data size: 171736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1636 Data size: 170713 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_city (type: varchar(60)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 1636 Data size: 165236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1636 Data size: 164213 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1636 Data size: 165236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1636 Data size: 164213 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(60)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -179,17 +179,17 @@ STAGE PLANS: keys: KEY._col0 (type: bigint), KEY._col1 (type: bigint), KEY._col2 (type: bigint), KEY._col3 (type: varchar(60)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5713516612 Data size: 1919324915684 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 1919324914661 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col2 (type: bigint), _col0 (type: bigint), _col4 (type: decimal(17,2)), _col5 (type: decimal(17,2)), substr(_col3, 1, 30) (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 5713516612 Data size: 1882402767360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 1882402766348 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col1 (type: bigint) - Statistics: Num rows: 5713516612 Data size: 1882402767360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 1882402766348 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)), _col4 (type: string) Reducer 4 Execution mode: vectorized, llap @@ -203,23 +203,23 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col5, _col6, _col7 input vertices: 0 Map 1 - Statistics: Num rows: 5713516612 Data size: 2879612372448 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 2879108640536 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Top N Key Operator sort order: ++++ keys: _col2 (type: char(30)), _col1 (type: char(20)), _col7 (type: string), _col6 (type: decimal(17,2)) null sort order: zzzz - Statistics: Num rows: 5713516612 Data size: 2879612372448 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 2879108640536 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: char(30)), _col1 (type: char(20)), _col3 (type: bigint), _col5 (type: decimal(17,2)), _col6 (type: decimal(17,2)), _col7 (type: string) outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6 - Statistics: Num rows: 5713516612 Data size: 2879612372448 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 2878604908352 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col6 (type: string), _col5 (type: decimal(17,2)) null sort order: zzzz sort order: ++++ - Statistics: Num rows: 5713516612 Data size: 2879612372448 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 2878604908352 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: decimal(17,2)) Reducer 5 Execution mode: vectorized, llap @@ -227,7 +227,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: char(30)), KEY.reducesinkkey1 (type: char(20)), KEY.reducesinkkey2 (type: string), VALUE._col0 (type: bigint), VALUE._col1 (type: decimal(17,2)), KEY.reducesinkkey3 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 5713516612 Data size: 2879612372448 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 5713516612 Data size: 2878604908352 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 50400 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query8.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query8.q.out index 24be5673172a..00ffad4cb0cc 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query8.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query8.q.out @@ -77,20 +77,20 @@ STAGE PLANS: TableScan alias: store filterExpr: substr(s_zip, 1, 2) is not null (type: boolean) - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 313381 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: substr(s_zip, 1, 2) is not null (type: boolean) - Statistics: Num rows: 1704 Data size: 315240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 311161 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), substr(s_zip, 1, 2) (type: string) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 310128 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 306118 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col2 (type: string) - Statistics: Num rows: 1704 Data size: 310128 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1692 Data size: 306118 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -136,41 +136,41 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (((substr(ca_zip, 1, 5)) IN ('89436', '30868', '65085', '22977', '83927', '77557', '58429', '40697', '80614', '10502', '32779', '91137', '61265', '98294', '17921', '18427', '21203', '59362', '87291', '84093', '21505', '17184', '10866', '67898', '25797', '28055', '18377', '80332', '74535', '21757', '29742', '90885', '29898', '17819', '40811', '25990', '47513', '89531', '91068', '10391', '18846', '99223', '82637', '41368', '83658', '86199', '81625', '26696', '89338', '88425', '32200', '81427', '19053', '77471', '36610', '99823', '43276', '41249', '48584', '83550', '82276', '18842', '78890', '14090', '38123', '40936', '34425', '19850', '43286', '80072', '79188', '54191', '11395', '50497', '84861', '90733', '21068', '57666', '37119', '25004', '57835', '70067', '62878', '95806', '19303', '18840', '19124', '29785', '16737', '16022', '49613', '89977', '68310', '60069', '98360', '48649', '39050', '41793', '25002', '27413', '39736', '47208', '16515', '94808', '57648', '15009', '80015', '42961', '63982', '21744', '71853', '81087', '67468', '34175', '64008', '20261', '11201', '51799', '48043', '45645', '61163', '48375', '36447', '57042', '21218', '41100', '89951', '22745', '35851', '83326', '61125', '78298', '80752', '49858', '52940', '96976', '63792', '11376', '53582', '18717', '90226', '50530', '94203', '99447', '27670', '96577', '57856', '56372', '16165', '23427', '54561', '28806', '44439', '22926', '30123', '61451', '92397', '56979', '92309', '70873', '13355', '21801', '46346', '37562', '56458', '28286', '47306', '99555', '69399', '26234', '47546', '49661', '88601', '35943', '39936', '25632', '24611', '44166', '56648', '30379', '59785', '11110', '14329', '93815', '52226', '71381', '13842', '25612', '63294', '14664', '21077', '82626', '18799', '60915', '81020', '56447', '76619', '11433', '13414', '42548', '92713', '70467', '30884', '47484', '16072', '38936', '13036', '88376', '45539', '35901', '19506', '65690', '73957', '71850', '49231', '14276', '20005', '18384', '76615', '11635', '38177', '55607', '41369', '95447', '58581', '58149', '91946', '33790', '76232', '75692', '95464', '22246', '51061', '56692', '53121', '77209', '15482', '10688', '14868', '45907', '73520', '72666', '25734', '17959', '24677', '66446', '94627', '53535', '15560', '41967', '69297', '11929', '59403', '33283', '52232', '57350', '43933', '40921', '36635', '10827', '71286', '19736', '80619', '25251', '95042', '15526', '36496', '55854', '49124', '81980', '35375', '49157', '63512', '28944', '14946', '36503', '54010', '18767', '23969', '43905', '66979', '33113', '21286', '58471', '59080', '13395', '79144', '70373', '67031', '38360', '26705', '50906', '52406', '26066', '73146', '15884', '31897', '30045', '61068', '45550', '92454', '13376', '14354', '19770', '22928', '97790', '50723', '46081', '30202', '14410', '20223', '88500', '67298', '13261', '14172', '81410', '93578', '83583', '46047', '94167', '82564', '21156', '15799', '86709', '37931', '74703', '83103', '23054', '70470', '72008', '49247', '91911', '69998', '20961', '70070', '63197', '54853', '88191', '91830', '49521', '19454', '81450', '89091', '62378', '25683', '61869', '51744', '36580', '85778', '36871', '48121', '28810', '83712', '45486', '67393', '26935', '42393', '20132', '55349', '86057', '21309', '80218', '10094', '11357', '48819', '39734', '40758', '30432', '21204', '29467', '30214', '61024', '55307', '74621', '11622', '68908', '33032', '52868', '99194', '99900', '84936', '69036', '99149', '45013', '32895', '59004', '32322', '14933', '32936', '33562', '72550', '27385', '58049', '58200', '16808', '21360', '32961', '18586', '79307', '15492') and substr(substr(ca_zip, 1, 5), 1, 2) is not null) or substr(substr(ca_zip, 1, 5), 1, 2) is not null) (type: boolean) - Statistics: Num rows: 40000000 Data size: 3560000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3453173033 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((substr(ca_zip, 1, 5)) IN ('89436', '30868', '65085', '22977', '83927', '77557', '58429', '40697', '80614', '10502', '32779', '91137', '61265', '98294', '17921', '18427', '21203', '59362', '87291', '84093', '21505', '17184', '10866', '67898', '25797', '28055', '18377', '80332', '74535', '21757', '29742', '90885', '29898', '17819', '40811', '25990', '47513', '89531', '91068', '10391', '18846', '99223', '82637', '41368', '83658', '86199', '81625', '26696', '89338', '88425', '32200', '81427', '19053', '77471', '36610', '99823', '43276', '41249', '48584', '83550', '82276', '18842', '78890', '14090', '38123', '40936', '34425', '19850', '43286', '80072', '79188', '54191', '11395', '50497', '84861', '90733', '21068', '57666', '37119', '25004', '57835', '70067', '62878', '95806', '19303', '18840', '19124', '29785', '16737', '16022', '49613', '89977', '68310', '60069', '98360', '48649', '39050', '41793', '25002', '27413', '39736', '47208', '16515', '94808', '57648', '15009', '80015', '42961', '63982', '21744', '71853', '81087', '67468', '34175', '64008', '20261', '11201', '51799', '48043', '45645', '61163', '48375', '36447', '57042', '21218', '41100', '89951', '22745', '35851', '83326', '61125', '78298', '80752', '49858', '52940', '96976', '63792', '11376', '53582', '18717', '90226', '50530', '94203', '99447', '27670', '96577', '57856', '56372', '16165', '23427', '54561', '28806', '44439', '22926', '30123', '61451', '92397', '56979', '92309', '70873', '13355', '21801', '46346', '37562', '56458', '28286', '47306', '99555', '69399', '26234', '47546', '49661', '88601', '35943', '39936', '25632', '24611', '44166', '56648', '30379', '59785', '11110', '14329', '93815', '52226', '71381', '13842', '25612', '63294', '14664', '21077', '82626', '18799', '60915', '81020', '56447', '76619', '11433', '13414', '42548', '92713', '70467', '30884', '47484', '16072', '38936', '13036', '88376', '45539', '35901', '19506', '65690', '73957', '71850', '49231', '14276', '20005', '18384', '76615', '11635', '38177', '55607', '41369', '95447', '58581', '58149', '91946', '33790', '76232', '75692', '95464', '22246', '51061', '56692', '53121', '77209', '15482', '10688', '14868', '45907', '73520', '72666', '25734', '17959', '24677', '66446', '94627', '53535', '15560', '41967', '69297', '11929', '59403', '33283', '52232', '57350', '43933', '40921', '36635', '10827', '71286', '19736', '80619', '25251', '95042', '15526', '36496', '55854', '49124', '81980', '35375', '49157', '63512', '28944', '14946', '36503', '54010', '18767', '23969', '43905', '66979', '33113', '21286', '58471', '59080', '13395', '79144', '70373', '67031', '38360', '26705', '50906', '52406', '26066', '73146', '15884', '31897', '30045', '61068', '45550', '92454', '13376', '14354', '19770', '22928', '97790', '50723', '46081', '30202', '14410', '20223', '88500', '67298', '13261', '14172', '81410', '93578', '83583', '46047', '94167', '82564', '21156', '15799', '86709', '37931', '74703', '83103', '23054', '70470', '72008', '49247', '91911', '69998', '20961', '70070', '63197', '54853', '88191', '91830', '49521', '19454', '81450', '89091', '62378', '25683', '61869', '51744', '36580', '85778', '36871', '48121', '28810', '83712', '45486', '67393', '26935', '42393', '20132', '55349', '86057', '21309', '80218', '10094', '11357', '48819', '39734', '40758', '30432', '21204', '29467', '30214', '61024', '55307', '74621', '11622', '68908', '33032', '52868', '99194', '99900', '84936', '69036', '99149', '45013', '32895', '59004', '32322', '14933', '32936', '33562', '72550', '27385', '58049', '58200', '16808', '21360', '32961', '18586', '79307', '15492') and substr(substr(ca_zip, 1, 5), 1, 2) is not null) (type: boolean) - Statistics: Num rows: 20000000 Data size: 1780000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19399848 Data size: 1674775834 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: substr(ca_zip, 1, 5) (type: string) outputColumnNames: _col0 - Statistics: Num rows: 20000000 Data size: 1780000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 19399848 Data size: 1674775834 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 133532 Data size: 12819072 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133546 Data size: 12467888 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 133532 Data size: 12819072 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133546 Data size: 12467888 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Filter Operator predicate: substr(substr(ca_zip, 1, 5), 1, 2) is not null (type: boolean) - Statistics: Num rows: 40000000 Data size: 3880000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38799696 Data size: 3659949147 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_zip (type: char(10)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 3880000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38799696 Data size: 3659949147 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3880000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38799696 Data size: 3659949147 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(10)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -179,20 +179,20 @@ STAGE PLANS: TableScan alias: customer filterExpr: ((c_preferred_cust_flag = 'Y') and c_current_addr_sk is not null) (type: boolean) - Statistics: Num rows: 80000000 Data size: 7440000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 7201952145 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((c_preferred_cust_flag = 'Y') and c_current_addr_sk is not null) (type: boolean) - Statistics: Num rows: 26666667 Data size: 2480000031 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3600976115 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_current_addr_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 26666667 Data size: 213333336 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 320000000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 26666667 Data size: 213333336 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 320000000 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 10 @@ -204,24 +204,24 @@ STAGE PLANS: keys: 0 KEY.reducesinkkey0 (type: bigint) 1 KEY.reducesinkkey0 (type: bigint) - outputColumnNames: _col1 + outputColumnNames: _col2 input vertices: - 0 Map 5 - Statistics: Num rows: 26666667 Data size: 2373333363 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 5 + Statistics: Num rows: 38799696 Data size: 3349551579 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: count() - keys: _col1 (type: char(10)) + keys: _col2 (type: char(10)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 63590 Data size: 6168230 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133546 Data size: 12597428 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(10)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(10)) - Statistics: Num rows: 63590 Data size: 6168230 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 133546 Data size: 12597428 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 11 Execution mode: vectorized, llap @@ -231,27 +231,27 @@ STAGE PLANS: keys: KEY._col0 (type: char(10)) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 6359 Data size: 616823 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9539 Data size: 899918 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col1 > 10L) (type: boolean) - Statistics: Num rows: 2119 Data size: 205543 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3179 Data size: 299997 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: substr(_col0, 1, 5) (type: string) outputColumnNames: _col0 - Statistics: Num rows: 2119 Data size: 205543 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3179 Data size: 299997 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: string) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 2119 Data size: 203424 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3179 Data size: 296912 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 2119 Data size: 203424 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3179 Data size: 296912 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 12 Execution mode: vectorized, llap @@ -261,20 +261,20 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 2119 Data size: 203424 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3179 Data size: 296912 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col1) keys: _col0 (type: string) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 9538 Data size: 915648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9538 Data size: 871736 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 9538 Data size: 915648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9538 Data size: 871736 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 2 Execution mode: vectorized, llap @@ -316,20 +316,20 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 9538 Data size: 915648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9539 Data size: 890664 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col1) keys: _col0 (type: string) minReductionHashAggr: 0.4 mode: hash outputColumnNames: _col0, _col1 - Statistics: Num rows: 9538 Data size: 915648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9538 Data size: 871736 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 9538 Data size: 915648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9538 Data size: 871736 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint) Reducer 8 Execution mode: vectorized, llap @@ -339,7 +339,7 @@ STAGE PLANS: keys: KEY._col0 (type: string) mode: mergepartial outputColumnNames: _col0, _col1 - Statistics: Num rows: 9538 Data size: 915648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 9538 Data size: 871736 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col1 = 2L) (type: boolean) Statistics: Num rows: 1 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query80.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query80.q.out index 86ce0891d9b0..7b9c0e980197 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query80.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query80.q.out @@ -7,23 +7,20 @@ STAGE PLANS: Tez #### A masked pattern was here #### Edges: - Map 1 <- Reducer 16 (BROADCAST_EDGE), Reducer 20 (BROADCAST_EDGE) - Map 10 <- Reducer 15 (BROADCAST_EDGE), Reducer 19 (BROADCAST_EDGE) + Map 1 <- Reducer 16 (BROADCAST_EDGE) + Map 10 <- Reducer 15 (BROADCAST_EDGE) Map 13 <- Reducer 15 (BROADCAST_EDGE) - Map 23 <- Reducer 17 (BROADCAST_EDGE), Reducer 21 (BROADCAST_EDGE) - Map 26 <- Reducer 17 (BROADCAST_EDGE) + Map 20 <- Reducer 17 (BROADCAST_EDGE) + Map 23 <- Reducer 17 (BROADCAST_EDGE) Map 7 <- Reducer 16 (BROADCAST_EDGE) - Reducer 11 <- Map 10 (CUSTOM_SIMPLE_EDGE), Map 13 (CUSTOM_SIMPLE_EDGE), Map 14 (BROADCAST_EDGE), Map 18 (BROADCAST_EDGE), Map 22 (BROADCAST_EDGE), Map 8 (BROADCAST_EDGE) + Reducer 11 <- Map 10 (CUSTOM_SIMPLE_EDGE), Map 13 (CUSTOM_SIMPLE_EDGE), Map 14 (BROADCAST_EDGE), Map 18 (BROADCAST_EDGE), Map 19 (BROADCAST_EDGE), Map 8 (BROADCAST_EDGE) Reducer 12 <- Reducer 11 (SIMPLE_EDGE), Union 4 (CONTAINS) Reducer 15 <- Map 14 (CUSTOM_SIMPLE_EDGE) Reducer 16 <- Map 14 (CUSTOM_SIMPLE_EDGE) Reducer 17 <- Map 14 (CUSTOM_SIMPLE_EDGE) - Reducer 19 <- Map 18 (CUSTOM_SIMPLE_EDGE) Reducer 2 <- Map 1 (CUSTOM_SIMPLE_EDGE), Map 14 (BROADCAST_EDGE), Map 18 (BROADCAST_EDGE), Map 7 (CUSTOM_SIMPLE_EDGE), Map 8 (BROADCAST_EDGE), Map 9 (BROADCAST_EDGE) - Reducer 20 <- Map 18 (CUSTOM_SIMPLE_EDGE) - Reducer 21 <- Map 18 (CUSTOM_SIMPLE_EDGE) - Reducer 24 <- Map 14 (BROADCAST_EDGE), Map 18 (BROADCAST_EDGE), Map 23 (CUSTOM_SIMPLE_EDGE), Map 26 (CUSTOM_SIMPLE_EDGE), Map 27 (BROADCAST_EDGE), Map 8 (BROADCAST_EDGE) - Reducer 25 <- Reducer 24 (SIMPLE_EDGE), Union 4 (CONTAINS) + Reducer 21 <- Map 14 (BROADCAST_EDGE), Map 18 (BROADCAST_EDGE), Map 20 (CUSTOM_SIMPLE_EDGE), Map 23 (CUSTOM_SIMPLE_EDGE), Map 24 (BROADCAST_EDGE), Map 8 (BROADCAST_EDGE) + Reducer 22 <- Reducer 21 (SIMPLE_EDGE), Union 4 (CONTAINS) Reducer 3 <- Reducer 2 (SIMPLE_EDGE), Union 4 (CONTAINS) Reducer 5 <- Union 4 (SIMPLE_EDGE) Reducer 6 <- Reducer 5 (SIMPLE_EDGE) @@ -33,10 +30,10 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_sales - filterExpr: (ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_20_item_i_item_sk_min) AND DynamicValue(RS_20_item_i_item_sk_max) and ss_promo_sk BETWEEN DynamicValue(RS_23_promotion_p_promo_sk_min) AND DynamicValue(RS_23_promotion_p_promo_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_20_item_i_item_sk_bloom_filter)) and in_bloom_filter(ss_promo_sk, DynamicValue(RS_23_promotion_p_promo_sk_bloom_filter))) (type: boolean) + filterExpr: (ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_20_item_i_item_sk_min) AND DynamicValue(RS_20_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_20_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 82510879939 Data size: 21315868812296 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (ss_store_sk is not null and ss_promo_sk is not null and ss_promo_sk BETWEEN DynamicValue(RS_23_promotion_p_promo_sk_min) AND DynamicValue(RS_23_promotion_p_promo_sk_max) and ss_item_sk BETWEEN DynamicValue(RS_20_item_i_item_sk_min) AND DynamicValue(RS_20_item_i_item_sk_max) and in_bloom_filter(ss_promo_sk, DynamicValue(RS_23_promotion_p_promo_sk_bloom_filter)) and in_bloom_filter(ss_item_sk, DynamicValue(RS_20_item_i_item_sk_bloom_filter))) (type: boolean) + predicate: (ss_store_sk is not null and ss_promo_sk is not null and ss_item_sk BETWEEN DynamicValue(RS_20_item_i_item_sk_min) AND DynamicValue(RS_20_item_i_item_sk_max) and in_bloom_filter(ss_item_sk, DynamicValue(RS_20_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 78675502838 Data size: 20325037116048 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ss_item_sk (type: bigint), ss_store_sk (type: bigint), ss_promo_sk (type: bigint), ss_ticket_number (type: bigint), ss_ext_sales_price (type: decimal(7,2)), ss_net_profit (type: decimal(7,2)), ss_sold_date_sk (type: bigint) @@ -55,10 +52,10 @@ STAGE PLANS: Map Operator Tree: TableScan alias: catalog_sales - filterExpr: (cs_catalog_page_sk is not null and cs_promo_sk is not null and cs_item_sk BETWEEN DynamicValue(RS_57_item_i_item_sk_min) AND DynamicValue(RS_57_item_i_item_sk_max) and cs_promo_sk BETWEEN DynamicValue(RS_60_promotion_p_promo_sk_min) AND DynamicValue(RS_60_promotion_p_promo_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_57_item_i_item_sk_bloom_filter)) and in_bloom_filter(cs_promo_sk, DynamicValue(RS_60_promotion_p_promo_sk_bloom_filter))) (type: boolean) + filterExpr: (cs_catalog_page_sk is not null and cs_promo_sk is not null and cs_item_sk BETWEEN DynamicValue(RS_57_item_i_item_sk_min) AND DynamicValue(RS_57_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_57_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 43005109025 Data size: 11339575410520 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (cs_catalog_page_sk is not null and cs_promo_sk is not null and cs_promo_sk BETWEEN DynamicValue(RS_60_promotion_p_promo_sk_min) AND DynamicValue(RS_60_promotion_p_promo_sk_max) and cs_item_sk BETWEEN DynamicValue(RS_57_item_i_item_sk_min) AND DynamicValue(RS_57_item_i_item_sk_max) and in_bloom_filter(cs_promo_sk, DynamicValue(RS_60_promotion_p_promo_sk_bloom_filter)) and in_bloom_filter(cs_item_sk, DynamicValue(RS_57_item_i_item_sk_bloom_filter))) (type: boolean) + predicate: (cs_catalog_page_sk is not null and cs_promo_sk is not null and cs_item_sk BETWEEN DynamicValue(RS_57_item_i_item_sk_min) AND DynamicValue(RS_57_item_i_item_sk_max) and in_bloom_filter(cs_item_sk, DynamicValue(RS_57_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 42789551679 Data size: 11282737308320 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: cs_catalog_page_sk (type: bigint), cs_item_sk (type: bigint), cs_promo_sk (type: bigint), cs_order_number (type: bigint), cs_ext_sales_price (type: decimal(7,2)), cs_net_profit (type: decimal(7,2)), cs_sold_date_sk (type: bigint) @@ -176,82 +173,85 @@ STAGE PLANS: Map 18 Map Operator Tree: TableScan - alias: promotion - filterExpr: (p_channel_tv = 'N') (type: boolean) - Statistics: Num rows: 2300 Data size: 213900 Basic stats: COMPLETE Column stats: COMPLETE + alias: date_dim + filterExpr: CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1998-08-04 00:00:00' AND TIMESTAMP'1998-09-03 00:00:00' (type: boolean) + Statistics: Num rows: 73049 Data size: 4675136 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (p_channel_tv = 'N') (type: boolean) - Statistics: Num rows: 1150 Data size: 106950 Basic stats: COMPLETE Column stats: COMPLETE + predicate: CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1998-08-04 00:00:00' AND TIMESTAMP'1998-09-03 00:00:00' (type: boolean) + Statistics: Num rows: 8116 Data size: 519424 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: p_promo_sk (type: bigint) + expressions: d_date_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) - minReductionHashAggr: 0.99 + keys: _col0 (type: bigint) + minReductionHashAggr: 0.4 mode: hash - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + outputColumnNames: _col0 + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Dynamic Partitioning Event Operator + Target column: cs_sold_date_sk (bigint) + Target Input: catalog_sales + Partition key expr: cs_sold_date_sk + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Target Vertex: Map 10 Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) - minReductionHashAggr: 0.99 + keys: _col0 (type: bigint) + minReductionHashAggr: 0.4 mode: hash - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + outputColumnNames: _col0 + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Dynamic Partitioning Event Operator + Target column: ws_sold_date_sk (bigint) + Target Input: web_sales + Partition key expr: ws_sold_date_sk + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Target Vertex: Map 20 Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 1150 Data size: 9200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1000000) - minReductionHashAggr: 0.99 + keys: _col0 (type: bigint) + minReductionHashAggr: 0.4 mode: hash - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) + outputColumnNames: _col0 + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Dynamic Partitioning Event Operator + Target column: ss_sold_date_sk (bigint) + Target Input: store_sales + Partition key expr: ss_sold_date_sk + Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Target Vertex: Map 1 Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 22 + Map 19 Map Operator Tree: TableScan alias: catalog_page @@ -269,14 +269,14 @@ STAGE PLANS: value expressions: _col1 (type: string) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 23 + Map 20 Map Operator Tree: TableScan alias: web_sales - filterExpr: (ws_web_site_sk is not null and ws_promo_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_95_item_i_item_sk_min) AND DynamicValue(RS_95_item_i_item_sk_max) and ws_promo_sk BETWEEN DynamicValue(RS_98_promotion_p_promo_sk_min) AND DynamicValue(RS_98_promotion_p_promo_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_95_item_i_item_sk_bloom_filter)) and in_bloom_filter(ws_promo_sk, DynamicValue(RS_98_promotion_p_promo_sk_bloom_filter))) (type: boolean) + filterExpr: (ws_web_site_sk is not null and ws_promo_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_95_item_i_item_sk_min) AND DynamicValue(RS_95_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_95_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 21594638446 Data size: 5700638697608 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (ws_web_site_sk is not null and ws_promo_sk is not null and ws_promo_sk BETWEEN DynamicValue(RS_98_promotion_p_promo_sk_min) AND DynamicValue(RS_98_promotion_p_promo_sk_max) and ws_item_sk BETWEEN DynamicValue(RS_95_item_i_item_sk_min) AND DynamicValue(RS_95_item_i_item_sk_max) and in_bloom_filter(ws_promo_sk, DynamicValue(RS_98_promotion_p_promo_sk_bloom_filter)) and in_bloom_filter(ws_item_sk, DynamicValue(RS_95_item_i_item_sk_bloom_filter))) (type: boolean) + predicate: (ws_web_site_sk is not null and ws_promo_sk is not null and ws_item_sk BETWEEN DynamicValue(RS_95_item_i_item_sk_min) AND DynamicValue(RS_95_item_i_item_sk_max) and in_bloom_filter(ws_item_sk, DynamicValue(RS_95_item_i_item_sk_bloom_filter))) (type: boolean) Statistics: Num rows: 21589233207 Data size: 5699211801048 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ws_item_sk (type: bigint), ws_web_site_sk (type: bigint), ws_promo_sk (type: bigint), ws_order_number (type: bigint), ws_ext_sales_price (type: decimal(7,2)), ws_net_profit (type: decimal(7,2)), ws_sold_date_sk (type: bigint) @@ -291,7 +291,7 @@ STAGE PLANS: value expressions: _col1 (type: bigint), _col2 (type: bigint), _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)), _col6 (type: bigint) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 26 + Map 23 Map Operator Tree: TableScan alias: web_returns @@ -313,7 +313,7 @@ STAGE PLANS: value expressions: _col2 (type: decimal(7,2)), _col3 (type: decimal(7,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) - Map 27 + Map 24 Map Operator Tree: TableScan alias: web_site @@ -356,82 +356,34 @@ STAGE PLANS: Map 8 Map Operator Tree: TableScan - alias: date_dim - filterExpr: CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1998-08-04 00:00:00' AND TIMESTAMP'1998-09-03 00:00:00' (type: boolean) - Statistics: Num rows: 73049 Data size: 4675136 Basic stats: COMPLETE Column stats: COMPLETE + alias: promotion + filterExpr: (p_channel_tv = 'N') (type: boolean) + Statistics: Num rows: 2300 Data size: 211690 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: CAST( d_date AS TIMESTAMP) BETWEEN TIMESTAMP'1998-08-04 00:00:00' AND TIMESTAMP'1998-09-03 00:00:00' (type: boolean) - Statistics: Num rows: 8116 Data size: 519424 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (p_channel_tv = 'N') (type: boolean) + Statistics: Num rows: 2300 Data size: 211690 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: d_date_sk (type: bigint) + expressions: p_promo_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: _col0 (type: bigint) - outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - keys: _col0 (type: bigint) - minReductionHashAggr: 0.4 - mode: hash - outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Dynamic Partitioning Event Operator - Target column: ss_sold_date_sk (bigint) - Target Input: store_sales - Partition key expr: ss_sold_date_sk - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 1 + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: _col0 (type: bigint) - outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - keys: _col0 (type: bigint) - minReductionHashAggr: 0.4 - mode: hash - outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Dynamic Partitioning Event Operator - Target column: ws_sold_date_sk (bigint) - Target Input: web_sales - Partition key expr: ws_sold_date_sk - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 23 + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Select Operator - expressions: _col0 (type: bigint) - outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Group By Operator - keys: _col0 (type: bigint) - minReductionHashAggr: 0.4 - mode: hash - outputColumnNames: _col0 - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Dynamic Partitioning Event Operator - Target column: cs_sold_date_sk (bigint) - Target Input: catalog_sales - Partition key expr: cs_sold_date_sk - Statistics: Num rows: 8116 Data size: 64928 Basic stats: COMPLETE Column stats: COMPLETE - Target Vertex: Map 10 + Statistics: Num rows: 2300 Data size: 18400 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 9 @@ -480,22 +432,22 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col6 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col0, _col4, _col5, _col6, _col9, _col10 + outputColumnNames: _col0, _col2, _col4, _col5, _col9, _col10 input vertices: 1 Map 18 - Statistics: Num rows: 17045880285 Data size: 4078164892288 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3787714088 Data size: 895347046408 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col6 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) outputColumnNames: _col0, _col4, _col5, _col9, _col10 input vertices: 1 Map 8 - Statistics: Num rows: 1893857044 Data size: 426528458096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3787714088 Data size: 865903292304 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -504,25 +456,25 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col4, _col5, _col9, _col10, _col15 input vertices: - 1 Map 22 - Statistics: Num rows: 1893857044 Data size: 601623318160 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 19 + Statistics: Num rows: 3787714088 Data size: 1215233000416 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col15 (type: string), _col4 (type: decimal(7,2)), if(_col9 is not null, _col9, 0) (type: decimal(7,2)), (_col5 - if(_col10 is not null, _col10, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 1893857044 Data size: 601623318160 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3787714088 Data size: 1215233000416 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1), sum(_col2), sum(_col3) keys: _col0 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 107889741 Data size: 47039927076 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 217890468 Data size: 95000244048 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 107889741 Data size: 47039927076 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 217890468 Data size: 95000244048 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: decimal(17,2)), _col3 (type: decimal(18,2)) Reducer 12 Execution mode: vectorized, llap @@ -612,19 +564,6 @@ STAGE PLANS: sort order: Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reducer 19 - Execution mode: vectorized, llap - Reduce Operator Tree: - Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1000000) - mode: final - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) Reducer 2 Execution mode: vectorized, llap Reduce Operator Tree: @@ -653,22 +592,22 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col6 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col1, _col4, _col5, _col6, _col9, _col10 + outputColumnNames: _col1, _col2, _col4, _col5, _col9, _col10 input vertices: 1 Map 18 - Statistics: Num rows: 31432193628 Data size: 7113224649584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6984453758 Data size: 1230973268960 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col6 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) outputColumnNames: _col1, _col4, _col5, _col9, _col10 input vertices: 1 Map 8 - Statistics: Num rows: 3492226879 Data size: 379694814792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6984453758 Data size: 1189891450720 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -678,52 +617,26 @@ STAGE PLANS: outputColumnNames: _col4, _col5, _col9, _col10, _col15 input vertices: 1 Map 9 - Statistics: Num rows: 3492226879 Data size: 715790771852 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6984453758 Data size: 1847272280648 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col15 (type: string), _col4 (type: decimal(7,2)), if(_col9 is not null, _col9, 0) (type: decimal(7,2)), (_col5 - if(_col10 is not null, _col10, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3492226879 Data size: 715790771852 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6984453758 Data size: 1847272280648 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1), sum(_col2), sum(_col3) keys: _col0 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 2458563 Data size: 1071933468 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6342864 Data size: 2765488704 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 2458563 Data size: 1071933468 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6342864 Data size: 2765488704 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: decimal(17,2)), _col3 (type: decimal(18,2)) - Reducer 20 - Execution mode: vectorized, llap - Reduce Operator Tree: - Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1000000) - mode: final - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) Reducer 21 - Execution mode: vectorized, llap - Reduce Operator Tree: - Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1000000) - mode: final - outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - Reduce Output Operator - null sort order: - sort order: - Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: bigint), _col1 (type: bigint), _col2 (type: binary) - Reducer 24 Execution mode: vectorized, llap Reduce Operator Tree: Map Join Operator @@ -734,7 +647,7 @@ STAGE PLANS: 1 KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey1 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col4, _col5, _col6, _col9, _col10 input vertices: - 1 Map 26 + 1 Map 23 Statistics: Num rows: 33633305448 Data size: 14391212980304 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Map Join Operator @@ -751,22 +664,22 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col6 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col1, _col4, _col5, _col6, _col9, _col10 + outputColumnNames: _col1, _col2, _col4, _col5, _col9, _col10 input vertices: 1 Map 18 - Statistics: Num rows: 8415060154 Data size: 2151835885288 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1869885354 Data size: 448426719584 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col6 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) outputColumnNames: _col1, _col4, _col5, _col9, _col10 input vertices: 1 Map 8 - Statistics: Num rows: 934942678 Data size: 216582544488 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1869885354 Data size: 433489245320 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -775,27 +688,27 @@ STAGE PLANS: 1 _col0 (type: bigint) outputColumnNames: _col4, _col5, _col9, _col10, _col15 input vertices: - 1 Map 27 - Statistics: Num rows: 934942678 Data size: 302618896072 Basic stats: COMPLETE Column stats: COMPLETE + 1 Map 24 + Statistics: Num rows: 1869885354 Data size: 605540323096 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col15 (type: string), _col4 (type: decimal(7,2)), if(_col9 is not null, _col9, 0) (type: decimal(7,2)), (_col5 - if(_col10 is not null, _col10, 0)) (type: decimal(8,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 934942678 Data size: 302618896072 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1869885354 Data size: 605540323096 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1), sum(_col2), sum(_col3) keys: _col0 (type: string) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 49686 Data size: 21663096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 99372 Data size: 43326192 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: string) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: string) - Statistics: Num rows: 49686 Data size: 21663096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 99372 Data size: 43326192 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(17,2)), _col2 (type: decimal(17,2)), _col3 (type: decimal(18,2)) - Reducer 25 + Reducer 22 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query81.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query81.q.out index 817a9878004c..ba260662e0cc 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query81.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query81.q.out @@ -23,15 +23,15 @@ STAGE PLANS: TableScan alias: customer filterExpr: c_current_addr_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_160_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0185202875 - Statistics: Num rows: 80000000 Data size: 30640000000 Basic stats: COMPLETE Column stats: COMPLETE + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_160_container, bigKeyColName:c_current_addr_sk, smallTablePos:1, keyRatio:0.0188764625 + Statistics: Num rows: 80000000 Data size: 29892558349 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: c_current_addr_sk is not null (type: boolean) - Statistics: Num rows: 80000000 Data size: 30640000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 29892558349 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_sk (type: bigint), c_customer_id (type: char(16)), c_current_addr_sk (type: bigint), c_salutation (type: char(10)), c_first_name (type: char(20)), c_last_name (type: char(30)) + expressions: c_customer_sk (type: bigint), c_customer_id (type: string), c_current_addr_sk (type: bigint), c_salutation (type: char(10)), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 80000000 Data size: 30640000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 29892558349 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -41,20 +41,20 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16 input vertices: 1 Map 10 - Statistics: Num rows: 1509434 Data size: 1983876888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1538463 Data size: 1592137965 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1509434 Data size: 1983876888 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col1 (type: char(16)), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: char(15)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(30)), _col13 (type: char(10)), _col14 (type: varchar(20)), _col15 (type: decimal(5,2)), _col16 (type: char(20)) + Statistics: Num rows: 1538463 Data size: 1592137965 Basic stats: COMPLETE Column stats: COMPLETE + value expressions: _col1 (type: string), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: char(15)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(30)), _col13 (type: char(10)), _col14 (type: varchar(20)), _col15 (type: decimal(5,2)), _col16 (type: char(20)) Select Operator expressions: _col0 (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 1509434 Data size: 12075472 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1538463 Data size: 12307704 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator - aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1481623) + aggregations: min(_col0), max(_col0), bloom_filter(_col0, expectedEntries=1510117) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 @@ -71,41 +71,41 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_state is not null or (ca_state = 'IL')) (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ca_state is not null (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_state (type: char(2)) outputColumnNames: _col0, _col1 - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Filter Operator predicate: (ca_state = 'IL') (type: boolean) - Statistics: Num rows: 754717 Data size: 778593839 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 772459990 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), ca_street_number (type: char(10)), ca_street_name (type: varchar(60)), ca_street_type (type: char(15)), ca_suite_number (type: char(10)), ca_city (type: varchar(60)), ca_county (type: varchar(30)), ca_zip (type: char(10)), ca_country (type: varchar(20)), ca_gmt_offset (type: decimal(5,2)), ca_location_type (type: char(20)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10 - Statistics: Num rows: 754717 Data size: 713688177 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 708290230 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 754717 Data size: 713688177 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 708290230 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(10)), _col2 (type: varchar(60)), _col3 (type: char(15)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: varchar(30)), _col7 (type: char(10)), _col8 (type: varchar(20)), _col9 (type: decimal(5,2)), _col10 (type: char(20)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -141,20 +141,20 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col6 input vertices: 1 Map 10 - Statistics: Num rows: 739053777 Data size: 142054564750 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 716886590 Data size: 137388039836 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col6 (type: char(2)), _col0 (type: bigint) minReductionHashAggr: 0.86675507 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 739053777 Data size: 151574886190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 716886590 Data size: 146908361276 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)), _col1 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: char(2)), _col1 (type: bigint) - Statistics: Num rows: 739053777 Data size: 151574886190 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 716886590 Data size: 146908361276 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)) Filter Operator predicate: (cr_returning_addr_sk is not null and cr_returning_customer_sk is not null and cr_returning_customer_sk BETWEEN DynamicValue(RS_57_customer_c_customer_sk_min) AND DynamicValue(RS_57_customer_c_customer_sk_max) and in_bloom_filter(cr_returning_customer_sk, DynamicValue(RS_57_customer_c_customer_sk_bloom_filter))) (type: boolean) @@ -182,20 +182,20 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col6 input vertices: 1 Reducer 11 - Statistics: Num rows: 724434361 Data size: 139244546270 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 702705669 Data size: 134668351326 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col0 (type: bigint), _col6 (type: char(2)) minReductionHashAggr: 0.8640661 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 724434361 Data size: 148576543742 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 702705669 Data size: 144000348798 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col1 (type: char(2)) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col1 (type: char(2)) - Statistics: Num rows: 724434361 Data size: 148576543742 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 702705669 Data size: 144000348798 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -269,13 +269,13 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 38800242 Data size: 3547138356 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(2)) Reducer 2 Execution mode: vectorized, llap Reduce Operator Tree: Group By Operator - aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1481623) + aggregations: min(VALUE._col0), max(VALUE._col1), bloom_filter(VALUE._col2, 1, expectedEntries=1510117) mode: final outputColumnNames: _col0, _col1, _col2 Statistics: Num rows: 1 Data size: 160 Basic stats: COMPLETE Column stats: COMPLETE @@ -292,24 +292,24 @@ STAGE PLANS: keys: KEY._col0 (type: char(2)), KEY._col1 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 716910171 Data size: 147033383714 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 695407170 Data size: 142506679842 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(2)), _col2 (type: decimal(17,2)) outputColumnNames: _col0, _col2 - Statistics: Num rows: 716910171 Data size: 147033383714 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 695407170 Data size: 142506679842 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2), count(_col2) keys: _col0 (type: char(2)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 30475 Data size: 6277850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 29521 Data size: 6077284 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(2)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(2)) - Statistics: Num rows: 30475 Data size: 6277850 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 29521 Data size: 6077284 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: decimal(27,2)), _col2 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -342,10 +342,10 @@ STAGE PLANS: keys: KEY._col0 (type: bigint), KEY._col1 (type: char(2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 716910171 Data size: 147033383722 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 695407170 Data size: 142504720598 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: _col2 is not null (type: boolean) - Statistics: Num rows: 716910171 Data size: 147033383722 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 695407170 Data size: 142504720598 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -355,7 +355,7 @@ STAGE PLANS: outputColumnNames: _col1, _col3, _col4, _col5, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col18, _col19 input vertices: 0 Map 1 - Statistics: Num rows: 716910171 Data size: 1079664179270 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 695407170 Data size: 1046751673767 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -365,37 +365,37 @@ STAGE PLANS: outputColumnNames: _col1, _col3, _col4, _col5, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15, _col16, _col19, _col20 input vertices: 1 Reducer 5 - Statistics: Num rows: 716910171 Data size: 1098303843716 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 708780384 Data size: 1085419068945 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (_col19 > _col20) (type: boolean) - Statistics: Num rows: 238970057 Data size: 366101281276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 236260128 Data size: 361806357143 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++++++++++++++ - keys: _col1 (type: char(16)), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: char(15)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(30)), _col13 (type: char(10)), _col14 (type: varchar(20)), _col15 (type: decimal(5,2)), _col16 (type: char(20)), _col19 (type: decimal(17,2)) + keys: _col1 (type: string), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: char(15)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(30)), _col13 (type: char(10)), _col14 (type: varchar(20)), _col15 (type: decimal(5,2)), _col16 (type: char(20)), _col19 (type: decimal(17,2)) null sort order: zzzzzzzzzzzzzzz - Statistics: Num rows: 238970057 Data size: 366101281276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 236260128 Data size: 361806357143 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator - expressions: _col1 (type: char(16)), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: char(15)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(30)), _col13 (type: char(10)), _col14 (type: varchar(20)), _col15 (type: decimal(5,2)), _col16 (type: char(20)), _col19 (type: decimal(17,2)) + expressions: _col1 (type: string), _col3 (type: char(10)), _col4 (type: char(20)), _col5 (type: char(30)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: char(15)), _col10 (type: char(10)), _col11 (type: varchar(60)), _col12 (type: varchar(30)), _col13 (type: char(10)), _col14 (type: varchar(20)), _col15 (type: decimal(5,2)), _col16 (type: char(20)), _col19 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 238970057 Data size: 339335788732 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 236260128 Data size: 335201062646 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col0 (type: char(16)), _col1 (type: char(10)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: char(15)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: varchar(30)), _col10 (type: char(10)), _col11 (type: varchar(20)), _col12 (type: decimal(5,2)), _col13 (type: char(20)), _col14 (type: decimal(17,2)) + key expressions: _col0 (type: string), _col1 (type: char(10)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: char(15)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: varchar(30)), _col10 (type: char(10)), _col11 (type: varchar(20)), _col12 (type: decimal(5,2)), _col13 (type: char(20)), _col14 (type: decimal(17,2)) null sort order: zzzzzzzzzzzzzzz sort order: +++++++++++++++ - Statistics: Num rows: 238970057 Data size: 339335788732 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 236260128 Data size: 335201062646 Basic stats: COMPLETE Column stats: COMPLETE Reducer 7 Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)), KEY.reducesinkkey1 (type: char(10)), KEY.reducesinkkey2 (type: char(20)), KEY.reducesinkkey3 (type: char(30)), KEY.reducesinkkey4 (type: char(10)), KEY.reducesinkkey5 (type: varchar(60)), KEY.reducesinkkey6 (type: char(15)), KEY.reducesinkkey7 (type: char(10)), KEY.reducesinkkey8 (type: varchar(60)), KEY.reducesinkkey9 (type: varchar(30)), KEY.reducesinkkey10 (type: char(10)), KEY.reducesinkkey11 (type: varchar(20)), KEY.reducesinkkey12 (type: decimal(5,2)), KEY.reducesinkkey13 (type: char(20)), KEY.reducesinkkey14 (type: decimal(17,2)) + expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(10)), KEY.reducesinkkey2 (type: char(20)), KEY.reducesinkkey3 (type: char(30)), KEY.reducesinkkey4 (type: char(10)), KEY.reducesinkkey5 (type: varchar(60)), KEY.reducesinkkey6 (type: char(15)), KEY.reducesinkkey7 (type: char(10)), KEY.reducesinkkey8 (type: varchar(60)), KEY.reducesinkkey9 (type: varchar(30)), KEY.reducesinkkey10 (type: char(10)), KEY.reducesinkkey11 (type: varchar(20)), KEY.reducesinkkey12 (type: decimal(5,2)), KEY.reducesinkkey13 (type: char(20)), KEY.reducesinkkey14 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14 - Statistics: Num rows: 238970057 Data size: 339335788732 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 236260128 Data size: 335201062646 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 142000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: _col0 (type: char(16)), _col1 (type: char(10)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: char(15)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: varchar(30)), 'IL' (type: char(2)), _col10 (type: char(10)), _col11 (type: varchar(20)), _col12 (type: decimal(5,2)), _col13 (type: char(20)), _col14 (type: decimal(17,2)) + expressions: _col0 (type: string), _col1 (type: char(10)), _col2 (type: char(20)), _col3 (type: char(30)), _col4 (type: char(10)), _col5 (type: varchar(60)), _col6 (type: char(15)), _col7 (type: char(10)), _col8 (type: varchar(60)), _col9 (type: varchar(30)), 'IL' (type: char(2)), _col10 (type: char(10)), _col11 (type: varchar(20)), _col12 (type: decimal(5,2)), _col13 (type: char(20)), _col14 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8, _col9, _col10, _col11, _col12, _col13, _col14, _col15 Statistics: Num rows: 100 Data size: 150600 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query82.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query82.q.out index cbbe0e44173a..22a34814381a 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query82.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query82.q.out @@ -37,7 +37,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col4, _col5 input vertices: 1 Map 2 - Statistics: Num rows: 1247848 Data size: 514113264 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1247848 Data size: 514113080 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -47,13 +47,13 @@ STAGE PLANS: outputColumnNames: _col2, _col3, _col4, _col5 input vertices: 1 Map 4 - Statistics: Num rows: 138641 Data size: 56010852 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138641 Data size: 56010668 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col2 (type: bigint) - Statistics: Num rows: 138641 Data size: 56010852 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138641 Data size: 56010668 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: string), _col4 (type: varchar(200)), _col5 (type: decimal(7,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -62,20 +62,20 @@ STAGE PLANS: TableScan alias: item filterExpr: ((i_manufact_id) IN (129, 437, 663, 727) and i_current_price BETWEEN 30 AND 60) (type: boolean) - Statistics: Num rows: 462000 Data size: 188360804 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 188147916 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((i_manufact_id) IN (129, 437, 663, 727) and i_current_price BETWEEN 30 AND 60) (type: boolean) - Statistics: Num rows: 787 Data size: 320980 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 787 Data size: 320796 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)), i_current_price (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 787 Data size: 317836 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 787 Data size: 317652 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 787 Data size: 317836 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 787 Data size: 317652 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)), _col3 (type: decimal(7,2)) Select Operator expressions: _col0 (type: bigint) @@ -138,12 +138,12 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5 input vertices: 0 Map 1 - Statistics: Num rows: 147187549 Data size: 58286269292 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 147187549 Data size: 58286269108 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: +++ keys: _col3 (type: string), _col4 (type: varchar(200)), _col5 (type: decimal(7,2)) null sort order: zzz - Statistics: Num rows: 147187549 Data size: 58286269292 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 147187549 Data size: 58286269108 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Group By Operator keys: _col3 (type: string), _col4 (type: varchar(200)), _col5 (type: decimal(7,2)) diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query84.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query84.q.out index 2c2623c74223..8f22986823c6 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query84.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query84.q.out @@ -49,16 +49,16 @@ STAGE PLANS: Statistics: Num rows: 21903 Data size: 6220452 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: + - keys: _col2 (type: char(16)) + keys: _col2 (type: string) null sort order: z Statistics: Num rows: 21903 Data size: 6220452 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator - expressions: _col6 (type: string), _col2 (type: char(16)) + expressions: _col6 (type: string), _col2 (type: string) outputColumnNames: _col1, _col2 Statistics: Num rows: 21903 Data size: 6220452 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator - key expressions: _col2 (type: char(16)) + key expressions: _col2 (type: string) null sort order: z sort order: + Statistics: Num rows: 21903 Data size: 6220452 Basic stats: COMPLETE Column stats: COMPLETE @@ -88,12 +88,12 @@ STAGE PLANS: alias: customer filterExpr: (c_current_hdemo_sk is not null and c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_119_container, bigKeyColName:c_current_hdemo_sk, smallTablePos:1, keyRatio:2.836375E-4 - Statistics: Num rows: 80000000 Data size: 24275219040 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 23771488140 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (c_current_hdemo_sk is not null and c_current_cdemo_sk is not null and c_current_addr_sk is not null) (type: boolean) - Statistics: Num rows: 74500295 Data size: 22606387248 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 74500295 Data size: 22137286008 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: c_customer_id (type: char(16)), c_current_cdemo_sk (type: bigint), c_current_hdemo_sk (type: bigint), c_current_addr_sk (type: bigint), concat(concat(c_last_name, ', '), c_first_name) (type: string) + expressions: c_customer_id (type: string), c_current_cdemo_sk (type: bigint), c_current_hdemo_sk (type: bigint), c_current_addr_sk (type: bigint), concat(concat(c_last_name, ', '), c_first_name) (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4 Statistics: Num rows: 74500295 Data size: 22904388428 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator @@ -122,7 +122,7 @@ STAGE PLANS: sort order: + Map-reduce partition columns: _col1 (type: bigint) Statistics: Num rows: 22691 Data size: 6444252 Basic stats: COMPLETE Column stats: COMPLETE - value expressions: _col0 (type: char(16)), _col4 (type: string) + value expressions: _col0 (type: string), _col4 (type: string) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 5 @@ -130,10 +130,10 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_city = 'Hopewell') (type: boolean) - Statistics: Num rows: 40000000 Data size: 4040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3928420739 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_city = 'Hopewell') (type: boolean) - Statistics: Num rows: 40609 Data size: 4101509 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40609 Data size: 3988328 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 @@ -203,7 +203,7 @@ STAGE PLANS: Execution mode: vectorized, llap Reduce Operator Tree: Select Operator - expressions: KEY.reducesinkkey0 (type: char(16)), VALUE._col0 (type: string) + expressions: KEY.reducesinkkey0 (type: string), VALUE._col0 (type: string) outputColumnNames: _col0, _col1 Statistics: Num rows: 21903 Data size: 6220452 Basic stats: COMPLETE Column stats: COMPLETE Limit diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query85.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query85.q.out index f50a9a598ee1..6624e89da23b 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query85.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query85.q.out @@ -108,7 +108,7 @@ STAGE PLANS: TableScan alias: web_returns filterExpr: (wr_returning_cdemo_sk is not null and wr_refunded_cdemo_sk is not null and wr_reason_sk is not null and wr_refunded_addr_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_188_container, bigKeyColName:wr_refunded_cdemo_sk, smallTablePos:1, keyRatio:4.669891527614227E-6 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_188_container, bigKeyColName:wr_refunded_cdemo_sk, smallTablePos:1, keyRatio:9.519412074036258E-6 Statistics: Num rows: 2160007345 Data size: 562637317992 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (wr_returning_cdemo_sk is not null and wr_refunded_cdemo_sk is not null and wr_reason_sk is not null and wr_refunded_addr_sk is not null) (type: boolean) @@ -126,7 +126,7 @@ STAGE PLANS: outputColumnNames: _col0, _col1, _col3, _col4, _col5, _col6, _col7, _col9, _col10, _col11 input vertices: 1 Map 8 - Statistics: Num rows: 152543767 Data size: 22050576572 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 310954550 Data size: 65771952680 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -136,7 +136,7 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5, _col6, _col7, _col9, _col10, _col11, _col13, _col14, _col15, _col16, _col17, _col18, _col19, _col20 input vertices: 1 Reducer 10 - Statistics: Num rows: 39225543 Data size: 9061100673 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79959746 Data size: 18470701566 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -146,18 +146,18 @@ STAGE PLANS: outputColumnNames: _col0, _col4, _col5, _col6, _col7, _col9, _col10, _col11, _col15, _col16, _col17, _col18, _col19, _col20 input vertices: 1 Map 9 - Statistics: Num rows: 39225543 Data size: 2039728468 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79959746 Data size: 4157907024 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint), _col5 (type: bigint) null sort order: zz sort order: ++ Map-reduce partition columns: _col0 (type: bigint), _col5 (type: bigint) - Statistics: Num rows: 39225543 Data size: 2039728468 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79959746 Data size: 4157907024 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: bigint), _col6 (type: decimal(7,2)), _col7 (type: decimal(7,2)), _col9 (type: boolean), _col10 (type: boolean), _col11 (type: boolean), _col15 (type: boolean), _col16 (type: boolean), _col17 (type: boolean), _col18 (type: boolean), _col19 (type: boolean), _col20 (type: boolean) Select Operator expressions: _col0 (type: bigint), _col5 (type: bigint), hash(_col0,_col5) (type: int) outputColumnNames: _col0, _col1, _col3 - Statistics: Num rows: 39225543 Data size: 784510860 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79959746 Data size: 1599194920 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col0), max(_col0), min(_col1), max(_col1), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -176,20 +176,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: ((ca_state) IN ('GA', 'IN', 'KY', 'MO', 'MT', 'NM', 'OR', 'WI', 'WV') and (ca_country = 'United States')) (type: boolean) - Statistics: Num rows: 40000000 Data size: 7640000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 7420490932 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((ca_state) IN ('GA', 'IN', 'KY', 'MO', 'MT', 'NM', 'OR', 'WI', 'WV') and (ca_country = 'United States')) (type: boolean) - Statistics: Num rows: 3396227 Data size: 648679357 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 1284315894 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint), (ca_state) IN ('GA', 'KY', 'NM') (type: boolean), (ca_state) IN ('IN', 'MT', 'OR') (type: boolean), (ca_state) IN ('MO', 'WI', 'WV') (type: boolean) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3396227 Data size: 67924540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 138461540 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 3396227 Data size: 67924540 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 6923077 Data size: 138461540 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: boolean), _col2 (type: boolean), _col3 (type: boolean) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -250,11 +250,11 @@ STAGE PLANS: outputColumnNames: _col2, _col4, _col5, _col6, _col7, _col8, _col9, _col15, _col17, _col18, _col20, _col21, _col22, _col26, _col27, _col28, _col29, _col30, _col31 input vertices: 1 Map 6 - Statistics: Num rows: 470472027 Data size: 130148627368 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 959038956 Data size: 265314103256 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Filter Operator predicate: (((_col20 and _col4) or (_col21 and _col5) or (_col22 and _col6)) and ((_col26 and _col27 and _col7) or (_col28 and _col29 and _col8) or (_col30 and _col31 and _col9))) (type: boolean) - Statistics: Num rows: 132320256 Data size: 36604301136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 269729706 Data size: 74619591496 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -264,20 +264,20 @@ STAGE PLANS: outputColumnNames: _col2, _col17, _col18, _col36 input vertices: 1 Map 11 - Statistics: Num rows: 132320256 Data size: 40529846024 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 269729706 Data size: 82621662394 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2), count(_col2), sum(_col18), count(_col18), sum(_col17), count(_col17) keys: _col36 (type: char(100)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 11289 Data size: 3985017 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 22933 Data size: 8095349 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(100)) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: char(100)) - Statistics: Num rows: 11289 Data size: 3985017 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 22933 Data size: 8095349 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: bigint), _col2 (type: bigint), _col3 (type: decimal(17,2)), _col4 (type: bigint), _col5 (type: decimal(17,2)), _col6 (type: bigint) Reducer 3 Execution mode: vectorized, llap diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query86.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query86.q.out index b5e4b9aea65e..8cb56e5bf4e5 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query86.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query86.q.out @@ -42,11 +42,11 @@ STAGE PLANS: outputColumnNames: _col1, _col5, _col6 input vertices: 1 Map 6 - Statistics: Num rows: 4245547076 Data size: 1247888905592 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4245547076 Data size: 1247888699252 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col6 (type: char(50)), _col5 (type: char(50)), _col1 (type: decimal(7,2)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4245547076 Data size: 1247888905592 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4245547076 Data size: 1247888699252 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col0 (type: char(50)), _col1 (type: char(50)), 0L (type: bigint) @@ -54,13 +54,13 @@ STAGE PLANS: minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 15926625 Data size: 4809840750 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15765750 Data size: 4761255954 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: bigint) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: bigint) - Statistics: Num rows: 15926625 Data size: 4809840750 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15765750 Data size: 4761255954 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -105,17 +105,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: item - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_class (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 462000 Data size: 87780000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 87573660 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -127,17 +127,17 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: bigint) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3267 Data size: 986634 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 976668 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col3 (type: decimal(17,2)), _col2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3267 Data size: 986634 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 976668 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), CASE WHEN ((grouping(_col3, 0L) = UDFToLong(0))) THEN (_col0) ELSE (CAST( null AS CHAR(50))) END (type: char(50)), _col2 (type: decimal(17,2)) null sort order: aaa sort order: ++- Map-reduce partition columns: (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), CASE WHEN ((grouping(_col3, 0L) = UDFToLong(0))) THEN (_col0) ELSE (CAST( null AS CHAR(50))) END (type: char(50)) - Statistics: Num rows: 3267 Data size: 986634 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 976668 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col3 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -145,7 +145,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), VALUE._col1 (type: char(50)), KEY.reducesinkkey2 (type: decimal(17,2)), VALUE._col2 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 3267 Data size: 986634 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 976668 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -166,22 +166,22 @@ STAGE PLANS: window function: GenericUDAFRankEvaluator window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) isPivotResult: true - Statistics: Num rows: 3267 Data size: 986634 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 976668 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: -++ keys: (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), if(((grouping(_col3, 1L) + grouping(_col3, 0L)) = 0L), _col0, null) (type: char(50)), rank_window_0 (type: int) null sort order: azz - Statistics: Num rows: 3267 Data size: 986634 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 976668 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: decimal(17,2)), _col0 (type: char(50)), _col1 (type: char(50)), (grouping(_col3, 1L) + grouping(_col3, 0L)) (type: bigint), rank_window_0 (type: int), if(((grouping(_col3, 1L) + grouping(_col3, 0L)) = 0L), _col0, null) (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 3267 Data size: 999792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 989694 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: bigint), _col5 (type: char(50)), _col4 (type: int) null sort order: azz sort order: -++ - Statistics: Num rows: 3267 Data size: 999792 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 989694 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: decimal(17,2)), _col1 (type: char(50)), _col2 (type: char(50)) Reducer 4 Execution mode: vectorized, llap @@ -189,7 +189,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: decimal(17,2)), VALUE._col1 (type: char(50)), VALUE._col2 (type: char(50)), KEY.reducesinkkey0 (type: bigint), KEY.reducesinkkey2 (type: int) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 3267 Data size: 999702 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3234 Data size: 989604 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 30600 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query87.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query87.q.out index 334084e78ceb..86428615a9ba 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query87.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query87.q.out @@ -173,31 +173,31 @@ STAGE PLANS: Map Operator Tree: TableScan alias: customer - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: c_customer_sk (type: bigint), c_first_name (type: char(20)), c_last_name (type: char(30)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 80000000 Data size: 15040000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 80000000 Data size: 14536269100 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(20)), _col2 (type: char(30)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -245,20 +245,20 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6 input vertices: 1 Map 16 - Statistics: Num rows: 8374481746 Data size: 1976377692056 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8374481746 Data size: 1975873961156 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator keys: _col6 (type: char(30)), _col5 (type: char(20)), _col3 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 4187240873 Data size: 988188846028 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4187240873 Data size: 987936980578 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 4187240873 Data size: 988188846028 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4187240873 Data size: 987936980578 Basic stats: COMPLETE Column stats: COMPLETE Reducer 11 Execution mode: vectorized, llap Reduce Operator Tree: @@ -266,38 +266,38 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2093620436 Data size: 494094422896 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2093620436 Data size: 493968490306 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(20)), _col0 (type: char(30)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2093620436 Data size: 494094422896 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2093620436 Data size: 493968490306 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 523405109 Data size: 127710846596 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 523405109 Data size: 127679363516 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), 1L (type: bigint), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 523405109 Data size: 131898087468 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 523405109 Data size: 131866604388 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), _col4 (type: bigint), (_col3 * _col4) (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 1513369688 Data size: 381369161376 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1513369688 Data size: 381306195306 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col3), sum(_col4) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 756684844 Data size: 190684580688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 756684844 Data size: 190637356068 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 756684844 Data size: 190684580688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 756684844 Data size: 190637356068 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 14 Execution mode: vectorized, llap @@ -311,20 +311,20 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6 input vertices: 1 Map 16 - Statistics: Num rows: 4245017503 Data size: 1001824130708 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4245017503 Data size: 1001320399808 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator keys: _col6 (type: char(30)), _col5 (type: char(20)), _col3 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2122508751 Data size: 500912065236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2122508751 Data size: 500660199966 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 2122508751 Data size: 500912065236 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2122508751 Data size: 500660199966 Basic stats: COMPLETE Column stats: COMPLETE Reducer 15 Execution mode: vectorized, llap Reduce Operator Tree: @@ -332,38 +332,38 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1061254375 Data size: 250456032500 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1061254375 Data size: 250330100000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(20)), _col0 (type: char(30)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1061254375 Data size: 250456032500 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1061254375 Data size: 250330100000 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 265313593 Data size: 64736516692 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 265313593 Data size: 64705033792 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), 1L (type: bigint), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 265313593 Data size: 66859025436 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 265313593 Data size: 66827542536 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), _col4 (type: bigint), (_col3 * _col4) (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 281077860 Data size: 70831620720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 281077860 Data size: 70799154210 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col3), sum(_col4) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 140538930 Data size: 35415810360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 140538930 Data size: 35399085120 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 140538930 Data size: 35415810360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 140538930 Data size: 35399085120 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 2 Execution mode: vectorized, llap @@ -377,20 +377,20 @@ STAGE PLANS: outputColumnNames: _col3, _col5, _col6 input vertices: 1 Map 16 - Statistics: Num rows: 15839433273 Data size: 3738106252428 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15839433273 Data size: 3737602521528 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator keys: _col6 (type: char(30)), _col5 (type: char(20)), _col3 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 7919716636 Data size: 1869053126096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7919716636 Data size: 1868801260826 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 7919716636 Data size: 1869053126096 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7919716636 Data size: 1868801260826 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: @@ -398,38 +398,38 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 3959858318 Data size: 934526563048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3959858318 Data size: 934400630458 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(20)), _col0 (type: char(30)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 3959858318 Data size: 934526563048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3959858318 Data size: 934400630458 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col1 (type: char(30)), _col0 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 989964579 Data size: 241551357276 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 989964579 Data size: 241519874286 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), 2L (type: bigint), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 989964579 Data size: 249471073908 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 989964579 Data size: 249439590918 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), _col4 (type: bigint), (_col3 * _col4) (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 1513369688 Data size: 381369161376 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1513369688 Data size: 381306195306 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col3), sum(_col4) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 756684844 Data size: 190684580688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 756684844 Data size: 190637356068 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 756684844 Data size: 190684580688 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 756684844 Data size: 190637356068 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 5 Execution mode: vectorized, llap @@ -439,41 +439,41 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 378342422 Data size: 95342290344 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 378342422 Data size: 95318678124 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((_col3 > 0L) and ((_col3 * 2L) = _col4)) (type: boolean) - Statistics: Num rows: 63057070 Data size: 15890381640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63057070 Data size: 15886446390 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 63057070 Data size: 15890381640 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 63057070 Data size: 15886446390 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) mode: complete outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 15764267 Data size: 3846481148 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15764267 Data size: 3845497538 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), 2L (type: bigint), _col3 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 15764267 Data size: 3972595284 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 15764267 Data size: 3971611674 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date), _col4 (type: bigint), (_col3 * _col4) (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 281077860 Data size: 70831620720 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 281077860 Data size: 70799154210 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col3), sum(_col4) keys: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 140538930 Data size: 35415810360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 140538930 Data size: 35399085120 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) null sort order: zzz sort order: +++ Map-reduce partition columns: _col0 (type: char(30)), _col1 (type: char(20)), _col2 (type: date) - Statistics: Num rows: 140538930 Data size: 35415810360 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 140538930 Data size: 35399085120 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint) Reducer 7 Execution mode: vectorized, llap @@ -483,7 +483,7 @@ STAGE PLANS: keys: KEY._col0 (type: char(30)), KEY._col1 (type: char(20)), KEY._col2 (type: date) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4 - Statistics: Num rows: 70269465 Data size: 17707905180 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 70269465 Data size: 17699542650 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: bigint), _col4 (type: bigint) outputColumnNames: _col3, _col4 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query88.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query88.q.out index f9ab32981493..2931015a834b 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query88.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query88.q.out @@ -87,7 +87,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 33 - Statistics: Num rows: 62169611 Data size: 497356888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 68186024 Data size: 545488192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -127,7 +127,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 29 - Statistics: Num rows: 62169611 Data size: 497356888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 68186024 Data size: 545488192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -167,7 +167,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 32 - Statistics: Num rows: 62169611 Data size: 497356888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 68186024 Data size: 545488192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -207,7 +207,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 28 - Statistics: Num rows: 64348537 Data size: 514788296 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 70575814 Data size: 564606512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -247,7 +247,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 30 - Statistics: Num rows: 64348537 Data size: 514788296 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 70575814 Data size: 564606512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -287,7 +287,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Map 26 - Statistics: Num rows: 64348537 Data size: 514788296 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 70575814 Data size: 564606512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -327,7 +327,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 27 - Statistics: Num rows: 64348537 Data size: 514788296 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 70575814 Data size: 564606512 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -367,7 +367,7 @@ STAGE PLANS: 1 _col0 (type: bigint) input vertices: 1 Reducer 31 - Statistics: Num rows: 62169611 Data size: 497356888 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 68186024 Data size: 545488192 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -561,62 +561,62 @@ STAGE PLANS: TableScan alias: store filterExpr: (s_store_name = 'ese') (type: boolean) - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 162704 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (s_store_name = 'ese') (type: boolean) - Statistics: Num rows: 155 Data size: 14880 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 16320 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 11 @@ -811,7 +811,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 28 Execution mode: vectorized, llap Reduce Operator Tree: @@ -823,7 +823,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 29 Execution mode: vectorized, llap Reduce Operator Tree: @@ -835,7 +835,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 3 Execution mode: vectorized, llap Reduce Operator Tree: @@ -860,7 +860,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 31 Execution mode: vectorized, llap Reduce Operator Tree: @@ -872,7 +872,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 32 Execution mode: vectorized, llap Reduce Operator Tree: @@ -884,7 +884,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 33 Execution mode: vectorized, llap Reduce Operator Tree: @@ -896,7 +896,7 @@ STAGE PLANS: null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reducer 4 Execution mode: vectorized, llap Reduce Operator Tree: diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query89.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query89.q.out index 088291fc49b9..b4d22ea91b28 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query89.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query89.q.out @@ -18,7 +18,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: ss_store_sk is not null (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_82_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:0.0027806824526610506 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_82_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:0.003642158515606326 Statistics: Num rows: 82510879939 Data size: 10988352362648 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ss_store_sk is not null (type: boolean) @@ -36,7 +36,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col3, _col5, _col6, _col7 input vertices: 1 Map 5 - Statistics: Num rows: 1141571997 Data size: 331055879250 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1495239477 Data size: 433619442810 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -46,7 +46,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col5, _col6, _col7, _col9 input vertices: 1 Map 6 - Statistics: Num rows: 229436556 Data size: 65618855136 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 300517704 Data size: 85948057824 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -56,20 +56,20 @@ STAGE PLANS: outputColumnNames: _col2, _col5, _col6, _col7, _col9, _col11, _col12 input vertices: 1 Map 7 - Statistics: Num rows: 229436556 Data size: 106687998652 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 300517704 Data size: 139740724951 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col2) keys: _col5 (type: char(50)), _col6 (type: char(50)), _col7 (type: char(50)), _col9 (type: int), _col11 (type: varchar(50)), _col12 (type: varchar(50)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 16513200 Data size: 9528116400 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 87062976 Data size: 50235335384 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: int), _col4 (type: varchar(50)), _col5 (type: varchar(50)) null sort order: zzzzzz sort order: ++++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: int), _col4 (type: varchar(50)), _col5 (type: varchar(50)) - Statistics: Num rows: 16513200 Data size: 9528116400 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 87062976 Data size: 50235335384 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col6 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -78,20 +78,20 @@ STAGE PLANS: TableScan alias: item filterExpr: ((i_class) IN ('birdal ', 'musical ', 'pants ', 'parenting ', 'wallpaper ', 'womens ') and (i_category) IN ('Books ', 'Electronics ', 'Home ', 'Jewelry ', 'Men ', 'Shoes ') and (((i_category) IN ('Books ', 'Electronics ', 'Home ') and (i_class) IN ('musical ', 'parenting ', 'wallpaper ')) or ((i_category) IN ('Jewelry ', 'Men ', 'Shoes ') and (i_class) IN ('birdal ', 'pants ', 'womens ')))) (type: boolean) - Statistics: Num rows: 462000 Data size: 133980000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 133658360 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: ((i_class) IN ('birdal ', 'musical ', 'pants ', 'parenting ', 'wallpaper ', 'womens ') and (i_category) IN ('Books ', 'Electronics ', 'Home ', 'Jewelry ', 'Men ', 'Shoes ') and (((i_category) IN ('Books ', 'Electronics ', 'Home ') and (i_class) IN ('musical ', 'parenting ', 'wallpaper ')) or ((i_category) IN ('Jewelry ', 'Men ', 'Shoes ') and (i_class) IN ('birdal ', 'pants ', 'womens ')))) (type: boolean) - Statistics: Num rows: 6546 Data size: 1898340 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8574 Data size: 2480820 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_brand (type: char(50)), i_class (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3 - Statistics: Num rows: 6546 Data size: 1898340 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8574 Data size: 2480820 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 6546 Data size: 1898340 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 8574 Data size: 2480820 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -137,17 +137,17 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 316767 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: s_store_sk (type: bigint), s_store_name (type: varchar(50)), s_company_name (type: varchar(50)) outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 316767 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 1704 Data size: 318648 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 1704 Data size: 316767 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: varchar(50)), _col2 (type: varchar(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -159,13 +159,13 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: char(50)), KEY._col3 (type: int), KEY._col4 (type: varchar(50)), KEY._col5 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 39600 Data size: 22849200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 159456 Data size: 92006112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col2 (type: char(50)), _col0 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: varchar(50)) null sort order: aaaa sort order: ++++ Map-reduce partition columns: _col2 (type: char(50)), _col0 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: varchar(50)) - Statistics: Num rows: 39600 Data size: 22849200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 159456 Data size: 92006112 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: char(50)), _col3 (type: int), _col6 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -173,7 +173,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey1 (type: char(50)), VALUE._col0 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: int), KEY.reducesinkkey2 (type: varchar(50)), KEY.reducesinkkey3 (type: varchar(50)), VALUE._col2 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 39600 Data size: 22849200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 159456 Data size: 92006112 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -193,29 +193,29 @@ STAGE PLANS: name: avg window function: GenericUDAFAverageEvaluatorDecimal window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) - Statistics: Num rows: 39600 Data size: 22849200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 159456 Data size: 92006112 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: avg_window_0 (type: decimal(21,6)), _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col3 (type: int), _col4 (type: varchar(50)), _col5 (type: varchar(50)), _col6 (type: decimal(17,2)) outputColumnNames: avg_window_0, _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 39600 Data size: 22849200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 159456 Data size: 92006112 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: if((avg_window_0 <> 0), ((abs((_col6 - avg_window_0)) / avg_window_0) > 0.1), false) (type: boolean) - Statistics: Num rows: 19800 Data size: 13642200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79728 Data size: 54932592 Basic stats: COMPLETE Column stats: COMPLETE Top N Key Operator sort order: ++ keys: (_col6 - avg_window_0) (type: decimal(22,6)), _col4 (type: varchar(50)) null sort order: zz - Statistics: Num rows: 19800 Data size: 13642200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79728 Data size: 54932592 Basic stats: COMPLETE Column stats: COMPLETE top n: 100 Select Operator expressions: _col2 (type: char(50)), _col1 (type: char(50)), _col0 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: varchar(50)), _col3 (type: int), _col6 (type: decimal(17,2)), avg_window_0 (type: decimal(21,6)), (_col6 - avg_window_0) (type: decimal(22,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 19800 Data size: 15859800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79728 Data size: 63862128 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col8 (type: decimal(22,6)), _col3 (type: varchar(50)) null sort order: zz sort order: ++ - Statistics: Num rows: 19800 Data size: 15859800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79728 Data size: 63862128 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: char(50)), _col4 (type: varchar(50)), _col5 (type: int), _col6 (type: decimal(17,2)), _col7 (type: decimal(21,6)) Reducer 4 Execution mode: vectorized, llap @@ -223,7 +223,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), VALUE._col1 (type: char(50)), VALUE._col2 (type: char(50)), KEY.reducesinkkey1 (type: varchar(50)), VALUE._col3 (type: varchar(50)), VALUE._col4 (type: int), VALUE._col5 (type: decimal(17,2)), VALUE._col6 (type: decimal(21,6)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 19800 Data size: 13642200 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 79728 Data size: 54932592 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 68900 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query94.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query94.q.out index 6ca2d294e5f3..72232a14083a 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query94.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query94.q.out @@ -23,7 +23,7 @@ STAGE PLANS: TableScan alias: ws1 filterExpr: (ws_ship_addr_sk is not null and ws_web_site_sk is not null and ws_ship_date_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_119_container, bigKeyColName:ws_web_site_sk, smallTablePos:1, keyRatio:2.7777730824410645E-10 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_119_container, bigKeyColName:ws_web_site_sk, smallTablePos:1, keyRatio:3.240735262847908E-10 Statistics: Num rows: 21600036511 Data size: 5701632353848 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ws_ship_addr_sk is not null and ws_web_site_sk is not null and ws_ship_date_sk is not null) (type: boolean) @@ -41,7 +41,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col4, _col5, _col6 input vertices: 1 Map 8 - Statistics: Num rows: 407242361 Data size: 103520524440 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415074075 Data size: 105525443224 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -51,7 +51,7 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5, _col6 input vertices: 1 Map 9 - Statistics: Num rows: 58177483 Data size: 13737647176 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 69179015 Data size: 16466027112 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -61,18 +61,18 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5, _col6 input vertices: 1 Map 10 - Statistics: Num rows: 6463723 Data size: 904060128 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1197414288 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col4 (type: bigint) - Statistics: Num rows: 6463723 Data size: 904060128 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1197414288 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) Select Operator expressions: _col4 (type: bigint) outputColumnNames: _col4 - Statistics: Num rows: 6463723 Data size: 51709784 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 61488256 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col4), max(_col4), bloom_filter(_col4, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -167,20 +167,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_state = 'TX') (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_state = 'TX') (type: boolean) - Statistics: Num rows: 754717 Data size: 70943398 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 70323608 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 9 @@ -188,20 +188,20 @@ STAGE PLANS: TableScan alias: web_site filterExpr: (web_company_name = 'pri ') (type: boolean) - Statistics: Num rows: 84 Data size: 8064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 84 Data size: 7976 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (web_company_name = 'pri ') (type: boolean) - Statistics: Num rows: 12 Data size: 1152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14 Data size: 1344 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: web_site_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 12 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 12 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 2 @@ -217,23 +217,23 @@ STAGE PLANS: input vertices: 1 Map 11 residual filter predicates: {(_col3 <> _col14)} - Statistics: Num rows: 6463723 Data size: 912569800 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1215702432 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Select Operator expressions: _col4 (type: bigint), _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) outputColumnNames: _col4, _col5, _col6 - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col4 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col4 (type: bigint) - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(7,2)), _col6 (type: decimal(7,2)) Select Operator expressions: _col4 (type: bigint) outputColumnNames: _col4 - Statistics: Num rows: 6463723 Data size: 51709784 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 61488256 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col4), max(_col4), bloom_filter(_col4, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -257,21 +257,21 @@ STAGE PLANS: outputColumnNames: _col4, _col5, _col6 input vertices: 1 Map 12 - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Group By Operator aggregations: sum(_col5), sum(_col6) keys: _col4 (type: bigint) - minReductionHashAggr: 0.9166043 + minReductionHashAggr: 0.91660416 mode: hash outputColumnNames: _col0, _col2, _col3 - Statistics: Num rows: 2156188 Data size: 500235616 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3204915 Data size: 743540280 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 2156188 Data size: 500235616 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3204915 Data size: 743540280 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -281,7 +281,7 @@ STAGE PLANS: keys: KEY._col0 (type: bigint) mode: partial2 outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2156188 Data size: 500235616 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3204915 Data size: 743540280 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col0), sum(_col1), sum(_col2) mode: partial2 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query95.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query95.q.out index 3a966e9f29c8..58d788fd7e04 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query95.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query95.q.out @@ -28,7 +28,7 @@ STAGE PLANS: TableScan alias: ws1 filterExpr: (ws_ship_addr_sk is not null and ws_web_site_sk is not null and ws_ship_date_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_210_container, bigKeyColName:ws_web_site_sk, smallTablePos:1, keyRatio:2.7777730824410645E-10 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_210_container, bigKeyColName:ws_web_site_sk, smallTablePos:1, keyRatio:3.240735262847908E-10 Statistics: Num rows: 21600036511 Data size: 5528875272680 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ws_ship_addr_sk is not null and ws_web_site_sk is not null and ws_ship_date_sk is not null) (type: boolean) @@ -46,7 +46,7 @@ STAGE PLANS: outputColumnNames: _col0, _col2, _col3, _col4, _col5 input vertices: 1 Map 8 - Statistics: Num rows: 407242361 Data size: 100305764080 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 415074075 Data size: 102248029152 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -56,7 +56,7 @@ STAGE PLANS: outputColumnNames: _col0, _col3, _col4, _col5 input vertices: 1 Map 9 - Statistics: Num rows: 58177483 Data size: 13315405840 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 69179015 Data size: 15955773520 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -66,18 +66,18 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5 input vertices: 1 Map 10 - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col3 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col3 (type: bigint) - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) Select Operator expressions: _col3 (type: bigint) outputColumnNames: _col3 - Statistics: Num rows: 6463723 Data size: 51709784 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 61488256 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col3), max(_col3), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -196,20 +196,20 @@ STAGE PLANS: TableScan alias: customer_address filterExpr: (ca_state = 'TX') (type: boolean) - Statistics: Num rows: 40000000 Data size: 3760000000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 40000000 Data size: 3656820898 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ca_state = 'TX') (type: boolean) - Statistics: Num rows: 754717 Data size: 70943398 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 70323608 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ca_address_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 754717 Data size: 6037736 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 769231 Data size: 6153848 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 9 @@ -217,20 +217,20 @@ STAGE PLANS: TableScan alias: web_site filterExpr: (web_company_name = 'pri ') (type: boolean) - Statistics: Num rows: 84 Data size: 8064 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 84 Data size: 7976 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (web_company_name = 'pri ') (type: boolean) - Statistics: Num rows: 12 Data size: 1152 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14 Data size: 1344 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: web_site_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 12 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 12 Data size: 96 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 14 Data size: 112 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 12 @@ -345,19 +345,19 @@ STAGE PLANS: outputColumnNames: _col3, _col4, _col5 input vertices: 1 Reducer 13 - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE DynamicPartitionHashJoin: true Reduce Output Operator key expressions: _col3 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col3 (type: bigint) - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col4 (type: decimal(7,2)), _col5 (type: decimal(7,2)) Select Operator expressions: _col3 (type: bigint) outputColumnNames: _col3 - Statistics: Num rows: 6463723 Data size: 51709784 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 61488256 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: min(_col3), max(_col3), bloom_filter(_col3, expectedEntries=1000000) minReductionHashAggr: 0.99 @@ -379,20 +379,20 @@ STAGE PLANS: 0 _col3 (type: bigint) 1 _col0 (type: bigint) outputColumnNames: _col3, _col4, _col5 - Statistics: Num rows: 6463723 Data size: 895528872 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 7686032 Data size: 1179104560 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col4), sum(_col5) keys: _col3 (type: bigint) - minReductionHashAggr: 0.9166043 + minReductionHashAggr: 0.91660416 mode: hash outputColumnNames: _col0, _col2, _col3 - Statistics: Num rows: 2156188 Data size: 500235616 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3204915 Data size: 743540280 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 2156188 Data size: 500235616 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3204915 Data size: 743540280 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col2 (type: decimal(17,2)), _col3 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -402,7 +402,7 @@ STAGE PLANS: keys: KEY._col0 (type: bigint) mode: partial2 outputColumnNames: _col0, _col1, _col2 - Statistics: Num rows: 2156188 Data size: 500235616 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 3204915 Data size: 743540280 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count(_col0), sum(_col1), sum(_col2) mode: partial2 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query96.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query96.q.out index 80a49252e6d5..db7d34706fb4 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query96.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query96.q.out @@ -16,7 +16,7 @@ STAGE PLANS: TableScan alias: store_sales filterExpr: (ss_store_sk is not null and ss_hdemo_sk is not null and ss_sold_time_sk is not null) (type: boolean) - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_72_container, bigKeyColName:ss_hdemo_sk, smallTablePos:1, keyRatio:2.9979791175219683E-4 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_72_container, bigKeyColName:ss_store_sk, smallTablePos:1, keyRatio:3.288106095294814E-4 Statistics: Num rows: 86404891377 Data size: 1980339026496 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (ss_store_sk is not null and ss_hdemo_sk is not null and ss_sold_time_sk is not null) (type: boolean) @@ -39,21 +39,21 @@ STAGE PLANS: condition map: Inner Join 0 to 1 keys: - 0 _col2 (type: bigint) + 0 _col1 (type: bigint) 1 _col0 (type: bigint) - outputColumnNames: _col1 + outputColumnNames: _col2 input vertices: 1 Map 4 - Statistics: Num rows: 259040049 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 284442504 Data size: 8 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 keys: - 0 _col1 (type: bigint) + 0 _col2 (type: bigint) 1 _col0 (type: bigint) input vertices: 1 Map 5 - Statistics: Num rows: 25904006 Data size: 207232048 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 28410845 Data size: 227286760 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: count() minReductionHashAggr: 0.99 @@ -91,43 +91,43 @@ STAGE PLANS: Map 4 Map Operator Tree: TableScan - alias: store - filterExpr: (s_store_name = 'ese') (type: boolean) - Statistics: Num rows: 1704 Data size: 163584 Basic stats: COMPLETE Column stats: COMPLETE + alias: household_demographics + filterExpr: (hd_dep_count = 5) (type: boolean) + Statistics: Num rows: 7200 Data size: 86400 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (s_store_name = 'ese') (type: boolean) - Statistics: Num rows: 155 Data size: 14880 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (hd_dep_count = 5) (type: boolean) + Statistics: Num rows: 720 Data size: 8640 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: s_store_sk (type: bigint) + expressions: hd_demo_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 720 Data size: 5760 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 155 Data size: 1240 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 720 Data size: 5760 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Map 5 Map Operator Tree: TableScan - alias: household_demographics - filterExpr: (hd_dep_count = 5) (type: boolean) - Statistics: Num rows: 7200 Data size: 86400 Basic stats: COMPLETE Column stats: COMPLETE + alias: store + filterExpr: (s_store_name = 'ese') (type: boolean) + Statistics: Num rows: 1704 Data size: 162704 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator - predicate: (hd_dep_count = 5) (type: boolean) - Statistics: Num rows: 720 Data size: 8640 Basic stats: COMPLETE Column stats: COMPLETE + predicate: (s_store_name = 'ese') (type: boolean) + Statistics: Num rows: 170 Data size: 16320 Basic stats: COMPLETE Column stats: COMPLETE Select Operator - expressions: hd_demo_sk (type: bigint) + expressions: s_store_sk (type: bigint) outputColumnNames: _col0 - Statistics: Num rows: 720 Data size: 5760 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 720 Data size: 5760 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 170 Data size: 1360 Basic stats: COMPLETE Column stats: COMPLETE Execution mode: vectorized, llap LLAP IO: may be used (ACID table) Reducer 2 diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query98.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query98.q.out index c8fc334ead4c..6875fc958941 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query98.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query98.q.out @@ -17,7 +17,7 @@ STAGE PLANS: Map Operator Tree: TableScan alias: store_sales - probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_54_container, bigKeyColName:ss_item_sk, smallTablePos:1, keyRatio:0.2727272808584318 + probeDecodeDetails: cacheKey:HASH_MAP_MAPJOIN_54_container, bigKeyColName:ss_item_sk, smallTablePos:1, keyRatio:0.3000000119293359 Statistics: Num rows: 82510879939 Data size: 10343396725952 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: ss_item_sk (type: bigint), ss_ext_sales_price (type: decimal(7,2)), ss_sold_date_sk (type: bigint) @@ -32,7 +32,7 @@ STAGE PLANS: outputColumnNames: _col1, _col2, _col4, _col5, _col6, _col7, _col8 input vertices: 1 Map 5 - Statistics: Num rows: 22502967927 Data size: 15489075671302 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 24753264966 Data size: 17059782875474 Basic stats: COMPLETE Column stats: COMPLETE Map Join Operator condition map: Inner Join 0 to 1 @@ -42,20 +42,20 @@ STAGE PLANS: outputColumnNames: _col1, _col4, _col5, _col6, _col7, _col8 input vertices: 1 Map 6 - Statistics: Num rows: 2500158608 Data size: 1507113497776 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 2750174496 Data size: 1679624331446 Basic stats: COMPLETE Column stats: COMPLETE Group By Operator aggregations: sum(_col1) keys: _col8 (type: char(50)), _col7 (type: char(50)), _col4 (type: string), _col5 (type: varchar(200)), _col6 (type: decimal(7,2)) minReductionHashAggr: 0.99 mode: hash outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)) null sort order: zzzzz sort order: +++++ Map-reduce partition columns: _col0 (type: char(50)), _col1 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col5 (type: decimal(17,2)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -64,20 +64,20 @@ STAGE PLANS: TableScan alias: item filterExpr: (i_category) IN ('Books ', 'Jewelry ', 'Sports ') (type: boolean) - Statistics: Num rows: 462000 Data size: 270601408 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 462000 Data size: 270182180 Basic stats: COMPLETE Column stats: COMPLETE Filter Operator predicate: (i_category) IN ('Books ', 'Jewelry ', 'Sports ') (type: boolean) - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: i_item_sk (type: bigint), i_item_id (type: string), i_item_desc (type: varchar(200)), i_current_price (type: decimal(7,2)), i_class (type: char(50)), i_category (type: char(50)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col0 (type: bigint) null sort order: z sort order: + Map-reduce partition columns: _col0 (type: bigint) - Statistics: Num rows: 126000 Data size: 73800496 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 81055046 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col1 (type: string), _col2 (type: varchar(200)), _col3 (type: decimal(7,2)), _col4 (type: char(50)), _col5 (type: char(50)) Execution mode: vectorized, llap LLAP IO: may be used (ACID table) @@ -126,13 +126,13 @@ STAGE PLANS: keys: KEY._col0 (type: char(50)), KEY._col1 (type: char(50)), KEY._col2 (type: string), KEY._col3 (type: varchar(200)), KEY._col4 (type: decimal(7,2)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: char(50)) null sort order: a sort order: + Map-reduce partition columns: _col1 (type: char(50)) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col0 (type: char(50)), _col2 (type: string), _col3 (type: varchar(200)), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)) Reducer 3 Execution mode: vectorized, llap @@ -140,7 +140,7 @@ STAGE PLANS: Select Operator expressions: VALUE._col0 (type: char(50)), KEY.reducesinkkey0 (type: char(50)), VALUE._col1 (type: string), VALUE._col2 (type: varchar(200)), VALUE._col3 (type: decimal(7,2)), VALUE._col4 (type: decimal(17,2)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE PTF Operator Function definitions: Input definition @@ -160,16 +160,16 @@ STAGE PLANS: name: sum window function: GenericUDAFSumHiveDecimal window frame: ROWS PRECEDING(MAX)~FOLLOWING(MAX) - Statistics: Num rows: 126000 Data size: 86940000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 95634000 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col3 (type: varchar(200)), _col0 (type: char(50)), _col1 (type: char(50)), _col4 (type: decimal(7,2)), _col5 (type: decimal(17,2)), ((_col5 * 100) / sum_window_0) (type: decimal(38,17)), _col2 (type: string) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6 - Statistics: Num rows: 126000 Data size: 101052000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 111157200 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col1 (type: char(50)), _col2 (type: char(50)), _col6 (type: string), _col0 (type: varchar(200)), _col5 (type: decimal(38,17)) null sort order: zzzzz sort order: +++++ - Statistics: Num rows: 126000 Data size: 101052000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 111157200 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: decimal(7,2)), _col4 (type: decimal(17,2)) Reducer 4 Execution mode: vectorized, llap @@ -177,10 +177,10 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey3 (type: varchar(200)), KEY.reducesinkkey0 (type: char(50)), KEY.reducesinkkey1 (type: char(50)), VALUE._col0 (type: decimal(7,2)), VALUE._col1 (type: decimal(17,2)), KEY.reducesinkkey4 (type: decimal(38,17)) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5 - Statistics: Num rows: 126000 Data size: 88452000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 97297200 Basic stats: COMPLETE Column stats: COMPLETE File Output Operator compressed: false - Statistics: Num rows: 126000 Data size: 88452000 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 138600 Data size: 97297200 Basic stats: COMPLETE Column stats: COMPLETE table: input format: org.apache.hadoop.mapred.SequenceFileInputFormat output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat diff --git a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query99.q.out b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query99.q.out index 2733265a9214..4a2ada446e8d 100644 --- a/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query99.q.out +++ b/ql/src/test/results/clientpositive/perf/tpcds30tb/tez/query99.q.out @@ -171,16 +171,16 @@ STAGE PLANS: keys: KEY._col0 (type: string), KEY._col1 (type: char(30)), KEY._col2 (type: varchar(50)) mode: mergepartial outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 4860 Data size: 1598940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4680 Data size: 1539720 Basic stats: COMPLETE Column stats: COMPLETE Select Operator expressions: _col1 (type: char(30)), _col2 (type: varchar(50)), _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: bigint), _col0 (type: string) outputColumnNames: _col1, _col2, _col3, _col4, _col5, _col6, _col7, _col8 - Statistics: Num rows: 4860 Data size: 1598940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4680 Data size: 1539720 Basic stats: COMPLETE Column stats: COMPLETE Reduce Output Operator key expressions: _col8 (type: string), _col1 (type: char(30)), _col2 (type: varchar(50)) null sort order: zzz sort order: +++ - Statistics: Num rows: 4860 Data size: 1598940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4680 Data size: 1539720 Basic stats: COMPLETE Column stats: COMPLETE value expressions: _col3 (type: bigint), _col4 (type: bigint), _col5 (type: bigint), _col6 (type: bigint), _col7 (type: bigint) Reducer 3 Execution mode: vectorized, llap @@ -188,7 +188,7 @@ STAGE PLANS: Select Operator expressions: KEY.reducesinkkey0 (type: string), KEY.reducesinkkey1 (type: char(30)), KEY.reducesinkkey2 (type: varchar(50)), VALUE._col0 (type: bigint), VALUE._col1 (type: bigint), VALUE._col2 (type: bigint), VALUE._col3 (type: bigint), VALUE._col4 (type: bigint) outputColumnNames: _col0, _col1, _col2, _col3, _col4, _col5, _col6, _col7 - Statistics: Num rows: 4860 Data size: 1598940 Basic stats: COMPLETE Column stats: COMPLETE + Statistics: Num rows: 4680 Data size: 1539720 Basic stats: COMPLETE Column stats: COMPLETE Limit Number of rows: 100 Statistics: Num rows: 100 Data size: 32900 Basic stats: COMPLETE Column stats: COMPLETE diff --git a/standalone-metastore/metastore-server/src/test/java/org/apache/hadoop/hive/metastore/dbinstall/rules/PostgresTPCDS.java b/standalone-metastore/metastore-server/src/test/java/org/apache/hadoop/hive/metastore/dbinstall/rules/PostgresTPCDS.java index b0a692d82ca4..701f3d928529 100644 --- a/standalone-metastore/metastore-server/src/test/java/org/apache/hadoop/hive/metastore/dbinstall/rules/PostgresTPCDS.java +++ b/standalone-metastore/metastore-server/src/test/java/org/apache/hadoop/hive/metastore/dbinstall/rules/PostgresTPCDS.java @@ -31,7 +31,7 @@ */ public class PostgresTPCDS extends Postgres { public PostgresTPCDS() { - super(DockerImageName.parse("zabetak/postgres-tpcds-metastore:1.3").asCompatibleSubstituteFor("postgres")); + super(DockerImageName.parse("thomasrebele/postgres-tpcds-metastore:1.4").asCompatibleSubstituteFor("postgres")); container.withUsername("postgres"); } diff --git a/standalone-metastore/metastore-server/src/test/resources/sql/postgres/upgrade-3.1.3000-to-4.2.0.postgres.sql b/standalone-metastore/metastore-server/src/test/resources/sql/postgres/upgrade-3.1.3000-to-4.2.0.postgres.sql index 72d02a6bd3f1..405af46b370f 100644 --- a/standalone-metastore/metastore-server/src/test/resources/sql/postgres/upgrade-3.1.3000-to-4.2.0.postgres.sql +++ b/standalone-metastore/metastore-server/src/test/resources/sql/postgres/upgrade-3.1.3000-to-4.2.0.postgres.sql @@ -11,154 +11,23 @@ ALTER TABLE ONLY "WM_RESOURCEPLAN" ADD CONSTRAINT "UNIQUE_WM_RESOURCEPLAN" UNIQU UPDATE "TAB_COL_STATS" SET "ENGINE" = 'hive' WHERE "ENGINE" IS NULL; UPDATE "PART_COL_STATS" SET "ENGINE" = 'hive' WHERE "ENGINE" IS NULL; -ALTER TABLE "TAB_COL_STATS" ADD "HISTOGRAM" bytea; -ALTER TABLE "PART_COL_STATS" ADD "HISTOGRAM" bytea; - --- HIVE-23683 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_ENQUEUE_TIME" bigint; -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_ENQUEUE_TIME" bigint; - -- HIVE-22728 ALTER TABLE "KEY_CONSTRAINTS" DROP CONSTRAINT "KEY_CONSTRAINTS_pkey"; ALTER TABLE "KEY_CONSTRAINTS" ADD CONSTRAINT "CONSTRAINTS_PK" PRIMARY KEY ("PARENT_TBL_ID", "CONSTRAINT_NAME", "POSITION"); --- HIVE-21487 -CREATE INDEX "COMPLETED_COMPACTIONS_RES" ON "COMPLETED_COMPACTIONS" ("CC_DATABASE","CC_TABLE","CC_PARTITION"); - - --- HIVE-23107 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_NEXT_TXN_ID" bigint; ---DROP TABLE "MIN_HISTORY_LEVEL"; - -- HIVE-23048 INSERT INTO "TXNS" ("TXN_ID", "TXN_STATE", "TXN_STARTED", "TXN_LAST_HEARTBEAT", "TXN_USER", "TXN_HOST") SELECT COALESCE(MAX("CTC_TXNID"),0), 'c', 0, 0, '', '' FROM "COMPLETED_TXN_COMPONENTS"; -CREATE SEQUENCE "TXNS_TXN_ID_SEQ" MINVALUE 0 OWNED BY "TXNS"."TXN_ID"; +CREATE SEQUENCE "TXNS_TXN_ID_SEQ" MINVALUE 0; select setval('"TXNS_TXN_ID_SEQ"', (SELECT MAX("TXN_ID") FROM "TXNS")); ALTER TABLE "TXNS" ALTER "TXN_ID" SET DEFAULT nextval('"TXNS_TXN_ID_SEQ"'); ALTER TABLE "NEXT_TXN_ID" RENAME TO "TXN_LOCK_TBL"; ALTER TABLE "TXN_LOCK_TBL" RENAME COLUMN "NTXN_NEXT" TO "TXN_LOCK"; - ---Create table replication metrics -CREATE TABLE "REPLICATION_METRICS" ( - "RM_SCHEDULED_EXECUTION_ID" bigint NOT NULL, - "RM_POLICY" varchar(256) NOT NULL, - "RM_DUMP_EXECUTION_ID" bigint NOT NULL, - "RM_METADATA" varchar(4000), - "RM_PROGRESS" varchar(4000), - PRIMARY KEY("RM_SCHEDULED_EXECUTION_ID") - ); - ---Increase the size of RM_PROGRESS to accomodate the replication statistics -ALTER TABLE "REPLICATION_METRICS" ALTER "RM_PROGRESS" TYPE varchar(24000); - -ALTER TABLE "REPLICATION_METRICS" ALTER "RM_PROGRESS" TYPE varchar(10000); - -ALTER TABLE "REPLICATION_METRICS" ADD "MESSAGE_FORMAT" varchar(16); - ---Create indexes for the replication metrics table -CREATE INDEX "POLICY_IDX" ON "REPLICATION_METRICS" ("RM_POLICY"); -CREATE INDEX "DUMP_IDX" ON "REPLICATION_METRICS" ("RM_DUMP_EXECUTION_ID"); - --- Create stored procedure tables -CREATE TABLE "STORED_PROCS" ( - "SP_ID" BIGINT NOT NULL, - "CREATE_TIME" INTEGER NOT NULL, - "DB_ID" BIGINT NOT NULL, - "NAME" VARCHAR(256) NOT NULL, - "OWNER_NAME" VARCHAR(128) NOT NULL, - "SOURCE" TEXT NOT NULL, - PRIMARY KEY ("SP_ID") - ); - -CREATE UNIQUE INDEX "UNIQUESTOREDPROC" ON "STORED_PROCS" ("NAME", "DB_ID"); -ALTER TABLE ONLY "STORED_PROCS" ADD CONSTRAINT "STOREDPROC_FK1" FOREIGN KEY ("DB_ID") REFERENCES "DBS" ("DB_ID") DEFERRABLE; - --- HIVE-24291 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_TXN_ID" bigint; - --- HIVE-24275 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_COMMIT_TIME" bigint; - --- HIVE-24880 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_INITIATOR_ID" varchar(128); -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_INITIATOR_VERSION" varchar(128); -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_WORKER_VERSION" varchar(128); -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_INITIATOR_ID" varchar(128); -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_INITIATOR_VERSION" varchar(128); -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_WORKER_VERSION" varchar(128); - -- HIVE-24770 UPDATE "SERDES" SET "SLIB"='org.apache.hadoop.hive.serde2.MultiDelimitSerDe' where "SLIB"='org.apache.hadoop.hive.contrib.serde2.MultiDelimitSerDe'; --- HIVE-24396 --- Create DataConnectors and DataConnector_Params tables -CREATE TABLE "DATACONNECTORS" ( - "NAME" character varying(128) NOT NULL, - "TYPE" character varying(32) NOT NULL, - "URL" character varying(4000) NOT NULL, - "COMMENT" character varying(256), - "OWNER_NAME" character varying(256), - "OWNER_TYPE" character varying(10), - "CREATE_TIME" INTEGER NOT NULL, - PRIMARY KEY ("NAME") -); - -CREATE TABLE "DATACONNECTOR_PARAMS" ( - "NAME" character varying(128) NOT NULL, - "PARAM_KEY" character varying(180) NOT NULL, - "PARAM_VALUE" character varying(4000), - PRIMARY KEY ("NAME", "PARAM_KEY"), - CONSTRAINT "DATACONNECTOR_NAME_FK1" FOREIGN KEY ("NAME") REFERENCES "DATACONNECTORS"("NAME") ON DELETE CASCADE -); -ALTER TABLE "DBS" ADD "TYPE" character varying(32) DEFAULT 'NATIVE' NOT NULL; -ALTER TABLE "DBS" ADD "DATACONNECTOR_NAME" character varying(128); -ALTER TABLE "DBS" ADD "REMOTE_DBNAME" character varying(128); -UPDATE "DBS" SET "TYPE"= 'NATIVE' WHERE "TYPE" IS NULL; - --- HIVE-25737 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_CLEANER_START" bigint; - --- HIVE-25842 -CREATE TABLE "COMPACTION_METRICS_CACHE" ( - "CMC_DATABASE" varchar(128) NOT NULL, - "CMC_TABLE" varchar(128) NOT NULL, - "CMC_PARTITION" varchar(767), - "CMC_METRIC_TYPE" varchar(128) NOT NULL, - "CMC_METRIC_VALUE" integer NOT NULL, - "CMC_VERSION" integer NOT NULL -); - --- HIVE-25993 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_RETRY_RETENTION" integer NOT NULL DEFAULT 0; - --- HIVE-26280 -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_NEXT_TXN_ID" bigint; -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_TXN_ID" bigint; -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_COMMIT_TIME" bigint; - --- HIVE-26443 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_POOL_NAME" VARCHAR(128); -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_POOL_NAME" VARCHAR(128); - --- HIVE-26719 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_NUMBER_OF_BUCKETS" INTEGER; -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_NUMBER_OF_BUCKETS" INTEGER; - --- HIVE-26735 -ALTER TABLE "COMPACTION_QUEUE" ADD "CQ_ORDER_BY" VARCHAR(4000); -ALTER TABLE "COMPLETED_COMPACTIONS" ADD "CC_ORDER_BY" VARCHAR(4000); - --- HIVE-26704 -CREATE TABLE "MIN_HISTORY_WRITE_ID" ( - "MH_TXNID" bigint NOT NULL REFERENCES "TXNS" ("TXN_ID"), - "MH_DATABASE" varchar(128) NOT NULL, - "MH_TABLE" varchar(256) NOT NULL, - "MH_WRITEID" bigint NOT NULL -); - -- HIVE-29178 -- Table structure for CATALOG_PARAMS CREATE TABLE "CATALOG_PARAMS" (