digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: 0 ms";
2 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build: 0 ms<br>number of output rows: 1"];
}
3 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 3<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>1 ms (0 ms, 0 ms, 0 ms (stage 884.0: task 824))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 3<br>local bytes read: 171.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 3<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>48.0 B (16.0 B, 16.0 B, 16.0 B (stage 884.0: task 825))<br>local merged bytes read: 0.0 B<br>number of partitions: 1<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>171.0 B (56.0 B, 56.0 B, 59.0 B (stage 884.0: task 824))"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n287 ms (7 ms, 7 ms, 273 ms (stage 884.0: task 824))";
5 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>285 ms (6 ms, 7 ms, 272 ms (stage 884.0: task 824))<br>number of output rows: 3"];
6 [labelType="html" label="<br><b>Project</b><br><br>"];
}
7 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 1"];
subgraph cluster8 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n346 ms (25 ms, 27 ms, 294 ms (stage 884.0: task 824))";
9 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 9,522<br>number of input batches: 3"];
}
10 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 1<br>scan time total (min, med, max (stageId: taskId))<br>261 ms (6 ms, 7 ms, 248 ms (stage 884.0: task 824))<br>metadata time: 0 ms<br>size of files read: 9.9 MiB<br>number of output rows: 9,522"];
2->0;
3->2;
5->3;
6->5;
7->6;
9->7;
10->9;
}
11
AdaptiveSparkPlan isFinalPlan=true
HashAggregate(keys=[], functions=[count(1)])
WholeStageCodegen (3)
Exchange SinglePartition, ENSURE_REQUIREMENTS, [plan_id=12736]
HashAggregate(keys=[], functions=[partial_count(1)])
Project
WholeStageCodegen (2)
Filter ((DOCUMENT_ID_3241#76473 <=> 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) AND ((((((((((((CASE WHEN isnull(Contains(DOCUMENT_ID_3241#76473, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DOCUMENT_ID_3241#76473, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END OR CASE WHEN isnull(Contains(METADOCUMENT_ID_3242#76477, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(METADOCUMENT_ID_3242#76477, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(PATIENT_ID_3243#76479, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(PATIENT_ID_3243#76479, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(VISIT_ID_3244#76483, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(VISIT_ID_3244#76483, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(VISIT_UNIT_ID_3245#76484, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(VISIT_UNIT_ID_3245#76484, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(UNIT_3247#76481, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(UNIT_3247#76481, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(DELEGATE_UNIT_3248#76472, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DELEGATE_UNIT_3248#76472, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(HIERARCHY_UNIT_3249#76476, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(HIERARCHY_UNIT_3249#76476, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(TITLE_3250#76480, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(TITLE_3250#76480, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(DOCUMENT_TYPE_3251#76474, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DOCUMENT_TYPE_3251#76474, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(BODY_3253#76470, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(BODY_3253#76470, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(AUTHOR_3254#76469, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(AUTHOR_3254#76469, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(to_json(str_to_words(str_replace_regex(BODY_3253#76470, <br\s*\/?>, )), Some(Etc/UTC)), 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(to_json(str_to_words(str_replace_regex(BODY_3253#76470, <br\s*\/?>, )), Some(Etc/UTC)), 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END))
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet [AUTHOR_3254#76469,BODY_3253#76470,DELEGATE_UNIT_3248#76472,DOCUMENT_ID_3241#76473,DOCUMENT_TYPE_3251#76474,HIERARCHY_UNIT_3249#76476,METADOCUMENT_ID_3242#76477,PATIENT_ID_3243#76479,TITLE_3250#76480,UNIT_3247#76481,VISIT_ID_3244#76483,VISIT_UNIT_ID_3245#76484] Batched: true, DataFilters: [(DOCUMENT_ID_3241#76473 <=> 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF), ((((((((((((CASE WHEN isn..., Format: Parquet, Location: InMemoryFileIndex(1 paths)[file:/data/output/cache/parquet/uet/DOCUMENT_3240], PartitionFilters: [], PushedFilters: [EqualNullSafe(DOCUMENT_ID_3241,8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)], ReadSchema: struct<AUTHOR_3254:string,BODY_3253:string,DELEGATE_UNIT_3248:string,DOCUMENT_ID_3241:string,DOCU...
== Physical Plan ==
AdaptiveSparkPlan (14)
+- == Final Plan ==
* HashAggregate (8)
+- ShuffleQueryStage (7), Statistics(sizeInBytes=48.0 B, rowCount=3)
+- Exchange (6)
+- * HashAggregate (5)
+- * Project (4)
+- Filter (3)
+- * ColumnarToRow (2)
+- Scan parquet (1)
+- == Initial Plan ==
HashAggregate (13)
+- Exchange (12)
+- HashAggregate (11)
+- Project (10)
+- Filter (9)
+- Scan parquet (1)
(1) Scan parquet
Output [12]: [AUTHOR_3254#76469, BODY_3253#76470, DELEGATE_UNIT_3248#76472, DOCUMENT_ID_3241#76473, DOCUMENT_TYPE_3251#76474, HIERARCHY_UNIT_3249#76476, METADOCUMENT_ID_3242#76477, PATIENT_ID_3243#76479, TITLE_3250#76480, UNIT_3247#76481, VISIT_ID_3244#76483, VISIT_UNIT_ID_3245#76484]
Batched: true
Location: InMemoryFileIndex [file:/data/output/cache/parquet/uet/DOCUMENT_3240]
PushedFilters: [EqualNullSafe(DOCUMENT_ID_3241,8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)]
ReadSchema: struct<AUTHOR_3254:string,BODY_3253:string,DELEGATE_UNIT_3248:string,DOCUMENT_ID_3241:string,DOCUMENT_TYPE_3251:string,HIERARCHY_UNIT_3249:string,METADOCUMENT_ID_3242:string,PATIENT_ID_3243:string,TITLE_3250:string,UNIT_3247:string,VISIT_ID_3244:string,VISIT_UNIT_ID_3245:string>
(2) ColumnarToRow [codegen id : 1]
Input [12]: [AUTHOR_3254#76469, BODY_3253#76470, DELEGATE_UNIT_3248#76472, DOCUMENT_ID_3241#76473, DOCUMENT_TYPE_3251#76474, HIERARCHY_UNIT_3249#76476, METADOCUMENT_ID_3242#76477, PATIENT_ID_3243#76479, TITLE_3250#76480, UNIT_3247#76481, VISIT_ID_3244#76483, VISIT_UNIT_ID_3245#76484]
(3) Filter
Input [12]: [AUTHOR_3254#76469, BODY_3253#76470, DELEGATE_UNIT_3248#76472, DOCUMENT_ID_3241#76473, DOCUMENT_TYPE_3251#76474, HIERARCHY_UNIT_3249#76476, METADOCUMENT_ID_3242#76477, PATIENT_ID_3243#76479, TITLE_3250#76480, UNIT_3247#76481, VISIT_ID_3244#76483, VISIT_UNIT_ID_3245#76484]
Condition : ((DOCUMENT_ID_3241#76473 <=> 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) AND ((((((((((((CASE WHEN isnull(Contains(DOCUMENT_ID_3241#76473, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DOCUMENT_ID_3241#76473, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END OR CASE WHEN isnull(Contains(METADOCUMENT_ID_3242#76477, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(METADOCUMENT_ID_3242#76477, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(PATIENT_ID_3243#76479, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(PATIENT_ID_3243#76479, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(VISIT_ID_3244#76483, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(VISIT_ID_3244#76483, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(VISIT_UNIT_ID_3245#76484, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(VISIT_UNIT_ID_3245#76484, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(UNIT_3247#76481, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(UNIT_3247#76481, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(DELEGATE_UNIT_3248#76472, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DELEGATE_UNIT_3248#76472, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(HIERARCHY_UNIT_3249#76476, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(HIERARCHY_UNIT_3249#76476, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(TITLE_3250#76480, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(TITLE_3250#76480, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(DOCUMENT_TYPE_3251#76474, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DOCUMENT_TYPE_3251#76474, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(BODY_3253#76470, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(BODY_3253#76470, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(AUTHOR_3254#76469, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(AUTHOR_3254#76469, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(to_json(str_to_words(str_replace_regex(BODY_3253#76470, <br\s*\/?>, )), Some(Etc/UTC)), 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(to_json(str_to_words(str_replace_regex(BODY_3253#76470, <br\s*\/?>, )), Some(Etc/UTC)), 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END))
(4) Project [codegen id : 2]
Output: []
Input [12]: [AUTHOR_3254#76469, BODY_3253#76470, DELEGATE_UNIT_3248#76472, DOCUMENT_ID_3241#76473, DOCUMENT_TYPE_3251#76474, HIERARCHY_UNIT_3249#76476, METADOCUMENT_ID_3242#76477, PATIENT_ID_3243#76479, TITLE_3250#76480, UNIT_3247#76481, VISIT_ID_3244#76483, VISIT_UNIT_ID_3245#76484]
(5) HashAggregate [codegen id : 2]
Input: []
Keys: []
Functions [1]: [partial_count(1)]
Aggregate Attributes [1]: [count#76865L]
Results [1]: [count#76866L]
(6) Exchange
Input [1]: [count#76866L]
Arguments: SinglePartition, ENSURE_REQUIREMENTS, [plan_id=12736]
(7) ShuffleQueryStage
Output [1]: [count#76866L]
Arguments: 0
(8) HashAggregate [codegen id : 3]
Input [1]: [count#76866L]
Keys: []
Functions [1]: [count(1)]
Aggregate Attributes [1]: [count(1)#76862L]
Results [1]: [count(1)#76862L AS count#76863L]
(9) Filter
Input [12]: [AUTHOR_3254#76469, BODY_3253#76470, DELEGATE_UNIT_3248#76472, DOCUMENT_ID_3241#76473, DOCUMENT_TYPE_3251#76474, HIERARCHY_UNIT_3249#76476, METADOCUMENT_ID_3242#76477, PATIENT_ID_3243#76479, TITLE_3250#76480, UNIT_3247#76481, VISIT_ID_3244#76483, VISIT_UNIT_ID_3245#76484]
Condition : ((DOCUMENT_ID_3241#76473 <=> 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) AND ((((((((((((CASE WHEN isnull(Contains(DOCUMENT_ID_3241#76473, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DOCUMENT_ID_3241#76473, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END OR CASE WHEN isnull(Contains(METADOCUMENT_ID_3242#76477, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(METADOCUMENT_ID_3242#76477, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(PATIENT_ID_3243#76479, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(PATIENT_ID_3243#76479, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(VISIT_ID_3244#76483, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(VISIT_ID_3244#76483, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(VISIT_UNIT_ID_3245#76484, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(VISIT_UNIT_ID_3245#76484, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(UNIT_3247#76481, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(UNIT_3247#76481, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(DELEGATE_UNIT_3248#76472, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DELEGATE_UNIT_3248#76472, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(HIERARCHY_UNIT_3249#76476, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(HIERARCHY_UNIT_3249#76476, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(TITLE_3250#76480, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(TITLE_3250#76480, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(DOCUMENT_TYPE_3251#76474, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(DOCUMENT_TYPE_3251#76474, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(BODY_3253#76470, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(BODY_3253#76470, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(AUTHOR_3254#76469, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(AUTHOR_3254#76469, 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END) OR CASE WHEN isnull(Contains(to_json(str_to_words(str_replace_regex(BODY_3253#76470, <br\s*\/?>, )), Some(Etc/UTC)), 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF)) THEN false ELSE Contains(to_json(str_to_words(str_replace_regex(BODY_3253#76470, <br\s*\/?>, )), Some(Etc/UTC)), 8BE75A8015FDF0D67EA8C8C6A4008D75E25BAEEF) END))
(10) Project
Output: []
Input [12]: [AUTHOR_3254#76469, BODY_3253#76470, DELEGATE_UNIT_3248#76472, DOCUMENT_ID_3241#76473, DOCUMENT_TYPE_3251#76474, HIERARCHY_UNIT_3249#76476, METADOCUMENT_ID_3242#76477, PATIENT_ID_3243#76479, TITLE_3250#76480, UNIT_3247#76481, VISIT_ID_3244#76483, VISIT_UNIT_ID_3245#76484]
(11) HashAggregate
Input: []
Keys: []
Functions [1]: [partial_count(1)]
Aggregate Attributes [1]: [count#76865L]
Results [1]: [count#76866L]
(12) Exchange
Input [1]: [count#76866L]
Arguments: SinglePartition, ENSURE_REQUIREMENTS, [plan_id=12714]
(13) HashAggregate
Input [1]: [count#76866L]
Keys: []
Functions [1]: [count(1)]
Aggregate Attributes [1]: [count(1)#76862L]
Results [1]: [count(1)#76862L AS count#76863L]
(14) AdaptiveSparkPlan
Output [1]: [count#76863L]
Arguments: isFinalPlan=true