digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 5 ms";
2 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build: 0 ms<br>peak memory: 256.0 KiB<br>number of output rows: 1<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
}
3 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 72.0 B<br>number of coalesced partitions: 1"];
4 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 1<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>3 ms (0 ms, 0 ms, 3 ms (stage 13.0: task 14))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 1<br>local bytes read: 68.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 1<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>24.0 B (0.0 B, 0.0 B, 24.0 B (stage 13.0: task 14))<br>local merged bytes read: 0.0 B<br>number of partitions: 200<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>68.0 B (0.0 B, 0.0 B, 68.0 B (stage 13.0: task 14))"];
subgraph cluster5 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n109 ms (0 ms, 41 ms, 68 ms (stage 13.0: task 14))";
6 [labelType="html" label="<b>HashAggregate</b><br><br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 13.0: task 15))<br>time in aggregation build total (min, med, max (stageId: taskId))<br>88 ms (0 ms, 28 ms, 60 ms (stage 13.0: task 14))<br>peak memory total (min, med, max (stageId: taskId))<br>512.0 KiB (0.0 B, 256.0 KiB, 256.0 KiB (stage 13.0: task 15))<br>number of output rows: 1<br>number of sort fallback tasks: 0<br>avg hash probes per key: 0"];
7 [labelType="html" label="<br><b>Project</b><br><br>"];
8 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 1"];
9 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 26,236<br>number of input batches: 8"];
}
10 [labelType="html" label="<b>Scan parquet spark_catalog.default.airports</b><br><br>number of files read: 2<br>scan time total (min, med, max (stageId: taskId))<br>78 ms (0 ms, 27 ms, 51 ms (stage 13.0: task 14))<br>metadata time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 13.0: task 15))<br>size of files read total (min, med, max (stageId: taskId))<br>2.1 MiB (0.0 B, 0.0 B, 2.1 MiB (driver))<br>number of output rows: 26,236"];
2->0;
3->2;
4->3;
6->4;
7->6;
8->7;
9->8;
10->9;
}
11
AdaptiveSparkPlan isFinalPlan=true
HashAggregate(keys=[city#189], functions=[])
WholeStageCodegen (2)
AQEShuffleRead coalesced
Exchange hashpartitioning(city#189, 200), ENSURE_REQUIREMENTS, [plan_id=300]
HashAggregate(keys=[city#189], functions=[])
Project [city#189]
Filter (isnotnull(code#191) AND (code#191 = 0GA2))
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet spark_catalog.default.airports[city#189,code#191] Batched: true, DataFilters: [isnotnull(code#191), (code#191 = 0GA2)], Format: Parquet, Location: InMemoryFileIndex(1 paths)[file:/home/acdcadmin/spark-warehouse/airports], PartitionFilters: [], PushedFilters: [IsNotNull(code), EqualTo(code,0GA2)], ReadSchema: struct<city:string,code:string>