digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: 0 ms";
2 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build: 0 ms<br>number of output rows: 1"];
}
3 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 1<br>local merged chunks fetched: 0<br>shuffle write time: 0 ms<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 1<br>local bytes read: 59.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 1<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size: 16.0 B<br>local merged bytes read: 0.0 B<br>number of partitions: 1<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written: 59.0 B"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 5 ms";
5 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 4 ms<br>peak memory: 0.0 B<br>number of output rows: 1<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
6 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 1 ms<br>peak memory: 256.0 KiB<br>number of output rows: 476<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
}
7 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 5.4 KiB<br>number of coalesced partitions: 1"];
8 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 476<br>local merged chunks fetched: 0<br>shuffle write time: 2 ms<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 476<br>local bytes read: 5.1 KiB<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 1<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size: 14.9 KiB<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written: 5.1 KiB"];
subgraph cluster9 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: 23 ms";
10 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 14 ms<br>peak memory: 256.0 KiB<br>number of output rows: 476<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
11 [labelType="html" label="<br><b>Project</b><br><br>"];
12 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 509"];
13 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 717<br>number of input batches: 1"];
}
14 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 1<br>scan time: 5 ms<br>metadata time: 0 ms<br>size of files read: 26.2 KiB<br>number of output rows: 717"];
2->0;
3->2;
5->3;
6->5;
7->6;
8->7;
10->8;
11->10;
12->11;
13->12;
14->13;
}
15
AdaptiveSparkPlan isFinalPlan=true
HashAggregate(keys=[], functions=[count(1)])
WholeStageCodegen (3)
Exchange SinglePartition, ENSURE_REQUIREMENTS, [plan_id=2205]
HashAggregate(keys=[], functions=[partial_count(1)])
HashAggregate(keys=[COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168], functions=[])
WholeStageCodegen (2)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168, 10), ENSURE_REQUIREMENTS, [plan_id=2111]
HashAggregate(keys=[COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168], functions=[])
Project [str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >) AS COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Filter NOT (str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, LEFT) <=> str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, RIGHT))
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet [IN_UNIT_3349#11930,OUT_UNIT_3350#11933] Batched: true, DataFilters: [NOT (str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, LEFT) <=..., Format: Parquet, Location: InMemoryFileIndex(1 paths)[file:/data/output/cache/parquet/uet/VISIT_3342], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<IN_UNIT_3349:string,OUT_UNIT_3350:string>
== Physical Plan ==
AdaptiveSparkPlan (22)
+- == Final Plan ==
* HashAggregate (13)
+- ShuffleQueryStage (12), Statistics(sizeInBytes=16.0 B, rowCount=1)
+- Exchange (11)
+- * HashAggregate (10)
+- * HashAggregate (9)
+- AQEShuffleRead (8)
+- ShuffleQueryStage (7), Statistics(sizeInBytes=14.9 KiB, rowCount=476)
+- Exchange (6)
+- * HashAggregate (5)
+- * Project (4)
+- * Filter (3)
+- * ColumnarToRow (2)
+- Scan parquet (1)
+- == Initial Plan ==
HashAggregate (21)
+- Exchange (20)
+- HashAggregate (19)
+- HashAggregate (18)
+- Exchange (17)
+- HashAggregate (16)
+- Project (15)
+- Filter (14)
+- Scan parquet (1)
(1) Scan parquet
Output [2]: [IN_UNIT_3349#11930, OUT_UNIT_3350#11933]
Batched: true
Location: InMemoryFileIndex [file:/data/output/cache/parquet/uet/VISIT_3342]
ReadSchema: struct<IN_UNIT_3349:string,OUT_UNIT_3350:string>
(2) ColumnarToRow [codegen id : 1]
Input [2]: [IN_UNIT_3349#11930, OUT_UNIT_3350#11933]
(3) Filter [codegen id : 1]
Input [2]: [IN_UNIT_3349#11930, OUT_UNIT_3350#11933]
Condition : NOT (str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, LEFT) <=> str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, RIGHT))
(4) Project [codegen id : 1]
Output [1]: [str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >) AS COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Input [2]: [IN_UNIT_3349#11930, OUT_UNIT_3350#11933]
(5) HashAggregate [codegen id : 1]
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Functions: []
Aggregate Attributes: []
Results [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
(6) Exchange
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Arguments: hashpartitioning(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168, 10), ENSURE_REQUIREMENTS, [plan_id=2111]
(7) ShuffleQueryStage
Output [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Arguments: 0
(8) AQEShuffleRead
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Arguments: coalesced
(9) HashAggregate [codegen id : 2]
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Functions: []
Aggregate Attributes: []
Results: []
(10) HashAggregate [codegen id : 2]
Input: []
Keys: []
Functions [1]: [partial_count(1)]
Aggregate Attributes [1]: [count#12499L]
Results [1]: [count#12500L]
(11) Exchange
Input [1]: [count#12500L]
Arguments: SinglePartition, ENSURE_REQUIREMENTS, [plan_id=2205]
(12) ShuffleQueryStage
Output [1]: [count#12500L]
Arguments: 1
(13) HashAggregate [codegen id : 3]
Input [1]: [count#12500L]
Keys: []
Functions [1]: [count(1)]
Aggregate Attributes [1]: [count(1)#12358L]
Results [1]: [count(1)#12358L AS count#12359L]
(14) Filter
Input [2]: [IN_UNIT_3349#11930, OUT_UNIT_3350#11933]
Condition : NOT (str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, LEFT) <=> str_extract_by_str(str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >), >, RIGHT))
(15) Project
Output [1]: [str_join(array(IN_UNIT_3349#11930, OUT_UNIT_3350#11933), >) AS COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Input [2]: [IN_UNIT_3349#11930, OUT_UNIT_3350#11933]
(16) HashAggregate
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Functions: []
Aggregate Attributes: []
Results [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
(17) Exchange
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Arguments: hashpartitioning(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168, 10), ENSURE_REQUIREMENTS, [plan_id=2080]
(18) HashAggregate
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#12168]
Functions: []
Aggregate Attributes: []
Results: []
(19) HashAggregate
Input: []
Keys: []
Functions [1]: [partial_count(1)]
Aggregate Attributes [1]: [count#12499L]
Results [1]: [count#12500L]
(20) Exchange
Input [1]: [count#12500L]
Arguments: SinglePartition, ENSURE_REQUIREMENTS, [plan_id=2084]
(21) HashAggregate
Input [1]: [count#12500L]
Keys: []
Functions [1]: [count(1)]
Aggregate Attributes [1]: [count(1)#12358L]
Results [1]: [count(1)#12358L AS count#12359L]
(22) AdaptiveSparkPlan
Output [1]: [count#12359L]
Arguments: isFinalPlan=true