digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 3 ms";
2 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 29"];
3 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 1 ms<br>peak memory: 64.2 MiB<br>number of output rows: 476<br>number of sort fallback tasks: 0<br>avg hash probes per key: 1"];
}
4 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 5.7 KiB<br>number of coalesced partitions: 1"];
5 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 476<br>local merged chunks fetched: 0<br>shuffle write time: 1 ms<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 476<br>local bytes read: 5.4 KiB<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 1<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size: 18.6 KiB<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written: 5.4 KiB"];
subgraph cluster6 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: 112 ms";
7 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 99 ms<br>peak memory: 256.0 KiB<br>number of output rows: 476<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
8 [labelType="html" label="<br><b>Project</b><br><br>"];
9 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 509"];
10 [labelType="html" label="<b>Scan JDBCRelation((SELECT RAWTOHEX(VISIT_ID), RAWTOHEX(PATIENT_ID), \"IN_DATE\", \"OUT_DATE\", \"IN_MODE\", \"OUT_MODE\", \"IN_UNIT\", \"OUT_UNIT\", \"VISIT_TYPE\", \"CHAMP_PMSI\", \"UNIT_PATH\", \"EMERGENCY\", \"CANCELED\" FROM \"DTM_622\".\"VISIT\") x) [numPartitions=1] </b><br><br>number of output rows: 717"];
}
2->0;
3->2;
4->3;
5->4;
7->5;
8->7;
9->8;
10->9;
}
11
AdaptiveSparkPlan isFinalPlan=true
Filter (COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L >= 2)
HashAggregate(keys=[COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888], functions=[count(1)])
WholeStageCodegen (2)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, 10), ENSURE_REQUIREMENTS, [plan_id=17541]
HashAggregate(keys=[COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888], functions=[partial_count(1)])
Project [str_join(array(IN_UNIT#110542, OUT_UNIT#110543), >) AS COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888]
Filter NOT (str_extract_by_str(str_join(array(IN_UNIT#110542, OUT_UNIT#110543), >), >, LEFT) <=> str_extract_by_str(str_join(array(IN_UNIT#110542, OUT_UNIT#110543), >), >, RIGHT))
Scan JDBCRelation((SELECT RAWTOHEX(VISIT_ID), RAWTOHEX(PATIENT_ID), "IN_DATE", "OUT_DATE", "IN_MODE", "OUT_MODE", "IN_UNIT", "OUT_UNIT", "VISIT_TYPE", "CHAMP_PMSI", "UNIT_PATH", "EMERGENCY", "CANCELED" FROM "DTM_622"."VISIT") x) [numPartitions=1] [IN_UNIT#110542,OUT_UNIT#110543] PushedFilters: [], ReadSchema: struct<IN_UNIT:string,OUT_UNIT:string>
WholeStageCodegen (1)
== Physical Plan ==
AdaptiveSparkPlan (14)
+- == Final Plan ==
* Filter (9)
+- * HashAggregate (8)
+- AQEShuffleRead (7)
+- ShuffleQueryStage (6), Statistics(sizeInBytes=18.6 KiB, rowCount=476)
+- Exchange (5)
+- * HashAggregate (4)
+- * Project (3)
+- * Filter (2)
+- * Scan JDBCRelation((SELECT RAWTOHEX(VISIT_ID), RAWTOHEX(PATIENT_ID), "IN_DATE", "OUT_DATE", "IN_MODE", "OUT_MODE", "IN_UNIT", "OUT_UNIT", "VISIT_TYPE", "CHAMP_PMSI", "UNIT_PATH", "EMERGENCY", "CANCELED" FROM "DTM_622"."VISIT") x) [numPartitions=1] (1)
+- == Initial Plan ==
CollectLimit (13)
+- Filter (12)
+- HashAggregate (11)
+- Exchange (10)
+- HashAggregate (4)
+- Project (3)
+- Filter (2)
+- Scan JDBCRelation((SELECT RAWTOHEX(VISIT_ID), RAWTOHEX(PATIENT_ID), "IN_DATE", "OUT_DATE", "IN_MODE", "OUT_MODE", "IN_UNIT", "OUT_UNIT", "VISIT_TYPE", "CHAMP_PMSI", "UNIT_PATH", "EMERGENCY", "CANCELED" FROM "DTM_622"."VISIT") x) [numPartitions=1] (1)
(1) Scan JDBCRelation((SELECT RAWTOHEX(VISIT_ID), RAWTOHEX(PATIENT_ID), "IN_DATE", "OUT_DATE", "IN_MODE", "OUT_MODE", "IN_UNIT", "OUT_UNIT", "VISIT_TYPE", "CHAMP_PMSI", "UNIT_PATH", "EMERGENCY", "CANCELED" FROM "DTM_622"."VISIT") x) [numPartitions=1] [codegen id : 1]
Output [2]: [IN_UNIT#110542, OUT_UNIT#110543]
ReadSchema: struct<IN_UNIT:string,OUT_UNIT:string>
(2) Filter [codegen id : 1]
Input [2]: [IN_UNIT#110542, OUT_UNIT#110543]
Condition : NOT (str_extract_by_str(str_join(array(IN_UNIT#110542, OUT_UNIT#110543), >), >, LEFT) <=> str_extract_by_str(str_join(array(IN_UNIT#110542, OUT_UNIT#110543), >), >, RIGHT))
(3) Project [codegen id : 1]
Output [1]: [str_join(array(IN_UNIT#110542, OUT_UNIT#110543), >) AS COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888]
Input [2]: [IN_UNIT#110542, OUT_UNIT#110543]
(4) HashAggregate [codegen id : 1]
Input [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888]
Functions [1]: [partial_count(1)]
Aggregate Attributes [1]: [count#111007L]
Results [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
(5) Exchange
Input [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
Arguments: hashpartitioning(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, 10), ENSURE_REQUIREMENTS, [plan_id=17541]
(6) ShuffleQueryStage
Output [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
Arguments: 0
(7) AQEShuffleRead
Input [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
Arguments: coalesced
(8) HashAggregate [codegen id : 2]
Input [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888]
Functions [1]: [count(1)]
Aggregate Attributes [1]: [count(1)#110932L]
Results [6]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888 AS COL_5ED88E4F_DF86_440D_9CC6_0C93B876ABF9#110945, count(1)#110932L AS COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L, str_join(array(E, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, LEFT)), -) AS COL_58CFE2E8_1D65_4D01_9EF3_F725F7BA87ED#110949, str_join(array(S, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, RIGHT)), -) AS COL_E7F5DF76_76CE_4B86_B00C_668C338F8FFF#110953, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, LEFT) AS COL_A67D3744_1C8E_4621_8489_9EA38D696691#110958, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, RIGHT) AS COL_55823422_AF79_46F7_807C_92C35F353A73#110964]
(9) Filter [codegen id : 2]
Input [6]: [COL_5ED88E4F_DF86_440D_9CC6_0C93B876ABF9#110945, COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L, COL_58CFE2E8_1D65_4D01_9EF3_F725F7BA87ED#110949, COL_E7F5DF76_76CE_4B86_B00C_668C338F8FFF#110953, COL_A67D3744_1C8E_4621_8489_9EA38D696691#110958, COL_55823422_AF79_46F7_807C_92C35F353A73#110964]
Condition : (COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L >= 2)
(10) Exchange
Input [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
Arguments: hashpartitioning(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, 10), ENSURE_REQUIREMENTS, [plan_id=17527]
(11) HashAggregate
Input [2]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, count#111008L]
Keys [1]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888]
Functions [1]: [count(1)]
Aggregate Attributes [1]: [count(1)#110932L]
Results [6]: [COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888 AS COL_5ED88E4F_DF86_440D_9CC6_0C93B876ABF9#110945, count(1)#110932L AS COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L, str_join(array(E, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, LEFT)), -) AS COL_58CFE2E8_1D65_4D01_9EF3_F725F7BA87ED#110949, str_join(array(S, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, RIGHT)), -) AS COL_E7F5DF76_76CE_4B86_B00C_668C338F8FFF#110953, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, LEFT) AS COL_A67D3744_1C8E_4621_8489_9EA38D696691#110958, str_extract_by_str(COL_EB0E2C34_212C_41D4_8CFF_862A35B3D6B5#110888, >, RIGHT) AS COL_55823422_AF79_46F7_807C_92C35F353A73#110964]
(12) Filter
Input [6]: [COL_5ED88E4F_DF86_440D_9CC6_0C93B876ABF9#110945, COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L, COL_58CFE2E8_1D65_4D01_9EF3_F725F7BA87ED#110949, COL_E7F5DF76_76CE_4B86_B00C_668C338F8FFF#110953, COL_A67D3744_1C8E_4621_8489_9EA38D696691#110958, COL_55823422_AF79_46F7_807C_92C35F353A73#110964]
Condition : (COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L >= 2)
(13) CollectLimit
Input [6]: [COL_5ED88E4F_DF86_440D_9CC6_0C93B876ABF9#110945, COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L, COL_58CFE2E8_1D65_4D01_9EF3_F725F7BA87ED#110949, COL_E7F5DF76_76CE_4B86_B00C_668C338F8FFF#110953, COL_A67D3744_1C8E_4621_8489_9EA38D696691#110958, COL_55823422_AF79_46F7_807C_92C35F353A73#110964]
Arguments: 50000
(14) AdaptiveSparkPlan
Output [6]: [COL_5ED88E4F_DF86_440D_9CC6_0C93B876ABF9#110945, COL_271E49E1_A230_499E_8192_978ECEDAE3B0#110946L, COL_58CFE2E8_1D65_4D01_9EF3_F725F7BA87ED#110949, COL_E7F5DF76_76CE_4B86_B00C_668C338F8FFF#110953, COL_A67D3744_1C8E_4621_8489_9EA38D696691#110958, COL_55823422_AF79_46F7_807C_92C35F353A73#110964]
Arguments: isFinalPlan=true