digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: 0 ms";
2 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build: 0 ms<br>number of output rows: 1"];
}
3 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 2<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 108.0: task 94))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 2<br>local bytes read: 118.0 B<br>fetch wait time: 0 ms<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 2<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>32.0 B (0.0 B, 16.0 B, 16.0 B (stage 108.0: task 94))<br>local merged bytes read: 0.0 B<br>number of partitions: 1<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>118.0 B (0.0 B, 59.0 B, 59.0 B (stage 108.0: task 94))"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n285 ms (99 ms, 186 ms, 186 ms (stage 108.0: task 93))";
5 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>284 ms (99 ms, 185 ms, 185 ms (stage 108.0: task 93))<br>number of output rows: 2"];
6 [labelType="html" label="<br><b>Project</b><br><br>"];
7 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 483"];
}
8 [labelType="html" label="<b>Scan csv </b><br><br>number of output rows: 31,257<br>number of files read: 1<br>metadata time: 0 ms<br>size of files read: 5.8 MiB"];
2->0;
3->2;
5->3;
6->5;
7->6;
8->7;
}
9
AdaptiveSparkPlan isFinalPlan=true
HashAggregate(keys=[], functions=[count(1)])
WholeStageCodegen (2)
Exchange SinglePartition, ENSURE_REQUIREMENTS, [plan_id=1379]
HashAggregate(keys=[], functions=[partial_count(1)])
Project
Filter ((isnull(ride_id#9482) OR (ended_at#9485 <= started_at#9484)) OR NOT (((isnotnull(end_station_id#9489) AND isnotnull(start_station_id#9487)) AND NOT (end_station_id#9489 = start_station_id#9487)) <=> true))
WholeStageCodegen (1)
FileScan csv [ride_id#9482,started_at#9484,ended_at#9485,start_station_id#9487,end_station_id#9489] Batched: false, DataFilters: [((isnull(ride_id#9482) OR (ended_at#9485 <= started_at#9484)) OR NOT (((isnotnull(end_station_id..., Format: CSV, Location: InMemoryFileIndex(1 paths)[s3a://rzvde-g8-kirsanov-dmitry/raw/citibike_data/202502/202502-citibik..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<ride_id:string,started_at:timestamp,ended_at:timestamp,start_station_id:string,end_station...