digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (6)\n \nduration: 0 ms";
2 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build: 0 ms<br>number of output rows: 1"];
}
3 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 1<br>local merged chunks fetched: 0<br>shuffle write time: 0 ms<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 1<br>local bytes read: 59.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 1<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size: 16.0 B<br>local merged bytes read: 0.0 B<br>number of partitions: 1<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written: 59.0 B"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (5)\n \nduration: 187 ms";
5 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 186 ms<br>peak memory: 0.0 B<br>number of output rows: 1<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
6 [labelType="html" label="<br><b>Project</b><br><br>"];
7 [labelType="html" label="<b>SortMergeJoin</b><br><br>number of output rows: 55,314<br>spill size: 0.0 B"];
}
subgraph cluster8 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: 321 ms";
9 [labelType="html" label="<b>Sort</b><br><br>sort time: 37 ms<br>peak memory: 66.0 MiB<br>spill size: 0.0 B"];
}
10 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 164.7 KiB<br>number of coalesced partitions: 1"];
11 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 55,314<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>9 ms (4 ms, 4 ms, 4 ms (stage 23.0: task 19))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 55,314<br>local bytes read: 159.4 KiB<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 2<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>3.0 MiB (854.4 KiB, 2.1 MiB, 2.1 MiB (stage 23.0: task 19))<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>159.4 KiB (45.6 KiB, 113.9 KiB, 113.9 KiB (stage 23.0: task 19))"];
subgraph cluster12 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n586 ms (229 ms, 357 ms, 357 ms (stage 23.0: task 19))";
13 [labelType="html" label="<br><b>Project</b><br><br>"];
}
14 [labelType="html" label="<b>Scan csv </b><br><br>number of output rows: 55,314<br>number of files read: 1<br>metadata time: 0 ms<br>size of files read: 5.6 MiB"];
subgraph cluster15 {
isCluster="true";
label="WholeStageCodegen (4)\n \nduration: 276 ms";
16 [labelType="html" label="<b>Sort</b><br><br>sort time: 7 ms<br>peak memory: 64.2 MiB<br>spill size: 0.0 B"];
}
17 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 132.1 KiB<br>number of coalesced partitions: 1"];
18 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 9,960<br>local merged chunks fetched: 0<br>shuffle write time: 8 ms<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 9,960<br>local bytes read: 124.5 KiB<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 1<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size: 544.7 KiB<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written: 124.5 KiB"];
subgraph cluster19 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 189 ms";
20 [labelType="html" label="<br><b>Project</b><br><br>"];
21 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 9,960"];
}
22 [labelType="html" label="<b>Scan csv </b><br><br>number of output rows: 9,960<br>number of files read: 1<br>metadata time: 0 ms<br>size of files read: 904.5 KiB"];
2->0;
3->2;
5->3;
6->5;
7->6;
9->7;
10->9;
11->10;
13->11;
14->13;
16->7;
17->16;
18->17;
20->18;
21->20;
22->21;
}
23
AdaptiveSparkPlan isFinalPlan=true
HashAggregate(keys=[], functions=[count(1)])
WholeStageCodegen (6)
Exchange SinglePartition, ENSURE_REQUIREMENTS, [plan_id=856]
HashAggregate(keys=[], functions=[partial_count(1)])
Project
SortMergeJoin [COL_21FE68DA_7812_4E10_B7FA_1CFA23C27FB3#1431, COL_3F3F1D84_AE9D_4449_9C67_EBB38C82D56F#1433], [MUTATION_14407_N_PATIENT_ETABL_14409#1467, MUTATION_14407_N_MUTATION_14408#1466], LeftOuter
WholeStageCodegen (5)
Sort [COL_21FE68DA_7812_4E10_B7FA_1CFA23C27FB3#1431 ASC NULLS FIRST, COL_3F3F1D84_AE9D_4449_9C67_EBB38C82D56F#1433 ASC NULLS FIRST], false, 0
WholeStageCodegen (3)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_21FE68DA_7812_4E10_B7FA_1CFA23C27FB3#1431, COL_3F3F1D84_AE9D_4449_9C67_EBB38C82D56F#1433, 10), ENSURE_REQUIREMENTS, [plan_id=692]
Project [N_Patient_Etablissement#1236 AS COL_21FE68DA_7812_4E10_B7FA_1CFA23C27FB3#1431, N_Mutation#1238 AS COL_3F3F1D84_AE9D_4449_9C67_EBB38C82D56F#1433]
WholeStageCodegen (1)
FileScan csv [N_Patient_Etablissement#1236,N_Mutation#1238] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/data/input/depot/csv/execution/BIOLOGIE_14335/current/biologie.csv], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<N_Patient_Etablissement:string,N_Mutation:string>
Sort [MUTATION_14407_N_PATIENT_ETABL_14409#1467 ASC NULLS FIRST, MUTATION_14407_N_MUTATION_14408#1466 ASC NULLS FIRST], false, 0
WholeStageCodegen (4)
AQEShuffleRead coalesced
Exchange hashpartitioning(MUTATION_14407_N_PATIENT_ETABL_14409#1467, MUTATION_14407_N_MUTATION_14408#1466, 10), ENSURE_REQUIREMENTS, [plan_id=705]
Project [N_Mutation#1073 AS MUTATION_14407_N_MUTATION_14408#1466, N_Patient_Etablissement#1074 AS MUTATION_14407_N_PATIENT_ETABL_14409#1467]
Filter (isnotnull(N_Patient_Etablissement#1074) AND isnotnull(N_Mutation#1073))
WholeStageCodegen (2)
FileScan csv [N_Mutation#1073,N_Patient_Etablissement#1074] Batched: false, DataFilters: [isnotnull(N_Patient_Etablissement#1074), isnotnull(N_Mutation#1073)], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/data/input/depot/csv/execution/MUTATION_14330/current/mutations...., PartitionFilters: [], PushedFilters: [IsNotNull(N_Patient_Etablissement), IsNotNull(N_Mutation)], ReadSchema: struct<N_Mutation:string,N_Patient_Etablissement:string>