digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
1 [labelType="html" label="<br><b>TakeOrderedAndProject</b><br><br>"];
subgraph cluster2 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 10 ms";
3 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 2 ms<br>peak memory: 16.3 MiB<br>number of output rows: 212<br>number of sort fallback tasks: 0<br>avg hash probes per key: 1"];
}
4 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 19.0 KiB<br>number of coalesced partitions: 1"];
5 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 1,223<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>17 ms (1 ms, 2 ms, 7 ms (stage 1277.0: task 1804))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 1,223<br>local bytes read: 18.1 KiB<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 6<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>47.8 KiB (7.7 KiB, 8.0 KiB, 8.1 KiB (stage 1277.0: task 1817))<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>18.1 KiB (2.9 KiB, 3.0 KiB, 3.1 KiB (stage 1277.0: task 1798))"];
subgraph cluster6 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n486 ms (23 ms, 100 ms, 121 ms (stage 1277.0: task 1817))";
7 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build total (min, med, max (stageId: taskId))<br>298 ms (15 ms, 50 ms, 102 ms (stage 1277.0: task 1817))<br>peak memory total (min, med, max (stageId: taskId))<br>97.5 MiB (16.3 MiB, 16.3 MiB, 16.3 MiB (stage 1277.0: task 1798))<br>number of output rows: 1,223<br>number of sort fallback tasks: 0<br>avg hash probes per key (min, med, max (stageId: taskId)):<br>(1, 1, 1 (stage 1277.0: task 1798))"];
8 [labelType="html" label="<br><b>Project</b><br><br>"];
9 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 81,008<br>number of input batches: 25"];
}
10 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 12<br>scan time total (min, med, max (stageId: taskId))<br>122 ms (8 ms, 23 ms, 44 ms (stage 1277.0: task 1825))<br>metadata time: 0 ms<br>size of files read: 5.2 MiB<br>number of output rows: 81,008"];
1->0;
3->1;
4->3;
5->4;
7->5;
8->7;
9->8;
10->9;
}
11
AdaptiveSparkPlan isFinalPlan=true
TakeOrderedAndProject(limit=500000, orderBy=[COL_9B8E7B3A_E221_4E23_AD70_A5E7A59B5C9C#229003 ASC NULLS FIRST], output=[COL_9B8E7B3A_E221_4E23_AD70_A5E7A59B5C9C#229003,COL_28029B36_F04E_40AD_A1F7_C6D015FF1776#229118L,COL_51F4C821_B6FD_4C8F_8754_943549BC69E8#229004])
HashAggregate(keys=[COL_7D82EA7A_3FA1_40E5_9841_750803E45C23#228057, COL_18FB24FA_3757_467B_AF03_07DCFD04D084#228059], functions=[count(1)])
WholeStageCodegen (2)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_7D82EA7A_3FA1_40E5_9841_750803E45C23#228057, COL_18FB24FA_3757_467B_AF03_07DCFD04D084#228059, 10), ENSURE_REQUIREMENTS, [plan_id=21200]
HashAggregate(keys=[knownfloatingpointnormalized(normalizenanandzero(COL_7D82EA7A_3FA1_40E5_9841_750803E45C23#228057)) AS COL_7D82EA7A_3FA1_40E5_9841_750803E45C23#228057, COL_18FB24FA_3757_467B_AF03_07DCFD04D084#228059], functions=[partial_count(1)])
Project [COL_730E830A_DE0D_4568_81F4_ED74ECA509F0#226558 AS COL_7D82EA7A_3FA1_40E5_9841_750803E45C23#228057, COL_20AD4F6D_147A_4072_A6A0_C62D0125E2C7#226560 AS COL_18FB24FA_3757_467B_AF03_07DCFD04D084#228059]
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet [COL_730E830A_DE0D_4568_81F4_ED74ECA509F0#226558,COL_20AD4F6D_147A_4072_A6A0_C62D0125E2C7#226560] Batched: true, DataFilters: [], Format: Parquet, Location: InMemoryFileIndex(1 paths)[file:/data/output/cache/parquet/datablock/PU_FICHIER_FICT_253787], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<COL_730E830A_DE0D_4568_81F4_ED74ECA509F0:double,COL_20AD4F6D_147A_4072_A6A0_C62D0125E2C7:s...