digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: 0 ms";
2 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 22 ms<br>peak memory: 64.2 MiB<br>number of output rows: 1<br>number of sort fallback tasks: 0<br>avg hash probes per key: 1"];
}
3 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 3.5 KiB<br>number of coalesced partitions: 1"];
4 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 40<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>106 ms (0 ms, 2 ms, 11 ms (stage 3.0: task 13))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 40<br>local bytes read: 679.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 2.7 KiB<br>merged fetch fallback count: 0<br>local blocks read: 8<br>remote merged chunks fetched: 0<br>remote blocks read: 32<br>data size total (min, med, max (stageId: taskId))<br>1040.0 B (32.0 B, 48.0 B, 48.0 B (stage 3.0: task 14))<br>local merged bytes read: 0.0 B<br>number of partitions: 37<br>remote reqs duration: 40 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>3.3 KiB (92.0 B, 165.0 B, 165.0 B (stage 3.0: task 14))"];
subgraph cluster5 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n9.5 s (106 ms, 388 ms, 671 ms (stage 3.0: task 9))";
6 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build total (min, med, max (stageId: taskId))<br>6.1 s (98 ms, 187 ms, 429 ms (stage 3.0: task 6))<br>peak memory total (min, med, max (stageId: taskId))<br>966.2 MiB (256.0 KiB, 64.2 MiB, 64.2 MiB (stage 3.0: task 14))<br>number of output rows: 40<br>number of sort fallback tasks: 0<br>avg hash probes per key (min, med, max (stageId: taskId)):<br>(1, 1, 1 (stage 3.0: task 14))"];
7 [labelType="html" label="<br><b>Project</b><br><br>"];
8 [labelType="html" label="<b>BroadcastHashJoin</b><br><br>number of output rows: 1,196"];
9 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 1,196<br>number of input batches: 25"];
}
10 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 25<br>scan time total (min, med, max (stageId: taskId))<br>5.9 s (98 ms, 186 ms, 407 ms (stage 3.0: task 9))<br>metadata time: 0 ms<br>size of files read: 83.2 KiB<br>number of output rows: 1,196"];
11 [labelType="html" label="<b>BroadcastExchange</b><br><br>time to broadcast: 14 ms<br>time to build: 50 ms<br>time to collect: 1.8 s<br>number of output rows: 1,196<br>data size: 64.1 MiB"];
subgraph cluster12 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: 908 ms";
13 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 1,196<br>number of input batches: 1"];
}
14 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 1<br>scan time: 900 ms<br>metadata time: 2 ms<br>size of files read: 8.1 KiB<br>number of output rows: 1,196"];
2->0;
3->2;
4->3;
6->4;
7->6;
8->7;
9->8;
10->9;
11->8;
13->11;
14->13;
}
15
AdaptiveSparkPlan isFinalPlan=true
HashAggregate(keys=[demandProfile#138], functions=[])
WholeStageCodegen (3)
AQEShuffleRead coalesced
Exchange hashpartitioning(demandProfile#138, 37), ENSURE_REQUIREMENTS, [plan_id=100]
HashAggregate(keys=[demandProfile#138], functions=[])
Project [demandProfile#138]
BroadcastHashJoin [coalesce(plant#128, ), isnull(plant#128), coalesce(product#127, ), isnull(product#127)], [coalesce(plant#136, ), isnull(plant#136), coalesce(product#135, ), isnull(product#135)], LeftOuter, BuildRight, false
ColumnarToRow
WholeStageCodegen (2)
FileScan parquet [product#127,plant#128] Batched: true, DataFilters: [], Format: Parquet, Location: InMemoryFileIndex(1 paths)[hdlfs://2e93940d-4be8-4f12-830d-f0b8d392c03a.files.hdl.prod-eu20.hanac..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<product:string,plant:string>
BroadcastExchange HashedRelationBroadcastMode(List(coalesce(input[1, string, true], ), isnull(input[1, string, true]), coalesce(input[0, string, true], ), isnull(input[0, string, true])),false), [plan_id=52]
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet [product#135,plant#136,demandprofile#138] Batched: true, DataFilters: [], Format: Parquet, Location: InMemoryFileIndex(1 paths)[hdlfs://2e93940d-4be8-4f12-830d-f0b8d392c03a.files.hdl.prod-eu20.hanac..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<product:string,plant:string,demandprofile:string>