digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
1 [labelType="html" label="<br><b>TakeOrderedAndProject</b><br><br>"];
subgraph cluster2 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 8 ms";
3 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 1 ms<br>peak memory: 16.3 MiB<br>number of output rows: 2<br>number of sort fallback tasks: 0<br>avg hash probes per key: 1"];
}
4 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 1404.0 B<br>number of coalesced partitions: 1"];
5 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 24<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>8 ms (0 ms, 0 ms, 0 ms (stage 468.0: task 604))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 24<br>local bytes read: 1307.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 12<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>960.0 B (80.0 B, 80.0 B, 80.0 B (stage 468.0: task 599))<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>1307.0 B (107.0 B, 109.0 B, 114.0 B (stage 468.0: task 599))"];
subgraph cluster6 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n6.3 s (256 ms, 590 ms, 628 ms (stage 468.0: task 601))";
7 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build total (min, med, max (stageId: taskId))<br>5.7 s (199 ms, 539 ms, 571 ms (stage 468.0: task 601))<br>peak memory total (min, med, max (stageId: taskId))<br>3.0 MiB (256.0 KiB, 256.0 KiB, 256.0 KiB (stage 468.0: task 599))<br>number of output rows: 24<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
8 [labelType="html" label="<br><b>Project</b><br><br>"];
9 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 346,976"];
10 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 525,855<br>number of input batches: 135"];
}
11 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 13<br>scan time total (min, med, max (stageId: taskId))<br>786 ms (35 ms, 66 ms, 112 ms (stage 468.0: task 609))<br>metadata time: 0 ms<br>size of files read: 105.5 MiB<br>number of output rows: 525,855"];
1->0;
3->1;
4->3;
5->4;
7->5;
8->7;
9->8;
10->9;
11->10;
}
12
AdaptiveSparkPlan isFinalPlan=true
TakeOrderedAndProject(limit=500000, orderBy=[COL_6E93BD53_C886_4091_B7F3_4186E8AE4620#96796 ASC NULLS FIRST], output=[COL_6E93BD53_C886_4091_B7F3_4186E8AE4620#96796,COL_80F43C4F_83A5_4D49_80A3_E8E8AF4F3113#96918L])
HashAggregate(keys=[COL_12F7278E_C726_4E60_B69C_D3A3AE032982#95628], functions=[count(1)])
WholeStageCodegen (2)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_12F7278E_C726_4E60_B69C_D3A3AE032982#95628, 10), ENSURE_REQUIREMENTS, [plan_id=7400]
HashAggregate(keys=[COL_12F7278E_C726_4E60_B69C_D3A3AE032982#95628], functions=[partial_count(1)])
Project [COL_C3DDDCF1_DCFA_4104_9FF4_8D48811031D9#94783 AS COL_12F7278E_C726_4E60_B69C_D3A3AE032982#95628]
Filter (CASE WHEN isnull(StartsWith(str_remove_accent(upper(COL_E0BD1FF3_108C_4B51_984D_A65E244263C2#94799)), 38)) THEN false ELSE StartsWith(str_remove_accent(upper(COL_E0BD1FF3_108C_4B51_984D_A65E244263C2#94799)), 38) END AND ((str_remove_accent(upper(COL_C3DDDCF1_DCFA_4104_9FF4_8D48811031D9#94783)) <=> UNE MAISON) OR (str_remove_accent(upper(COL_C3DDDCF1_DCFA_4104_9FF4_8D48811031D9#94783)) <=> UN APPARTEMENT)))
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet [COL_C3DDDCF1_DCFA_4104_9FF4_8D48811031D9#94783,COL_E0BD1FF3_108C_4B51_984D_A65E244263C2#94799] Batched: true, DataFilters: [CASE WHEN isnull(StartsWith(str_remove_accent(upper(COL_E0BD1FF3_108C_4B51_984D_A65E244263C2#947..., Format: Parquet, Location: InMemoryFileIndex(1 paths)[file:/data/output/cache/parquet/datablock/FONCIER_REFEREN_10755], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<COL_C3DDDCF1_DCFA_4104_9FF4_8D48811031D9:string,COL_E0BD1FF3_108C_4B51_984D_A65E244263C2:s...