digraph G {
0 [labelType="html" label="<br><b>TakeOrderedAndProject</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n6.1 s (5 ms, 13 ms, 474 ms (stage 1.1: task 147))";
2 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>5.0 s (3 ms, 7 ms, 470 ms (stage 1.1: task 147))<br>peak memory total (min, med, max (stageId: taskId))<br>3.2 GiB (16.5 MiB, 16.5 MiB, 16.5 MiB (stage 1.1: task 19))<br>number of output rows: 2,257,379<br>avg hash probe bucket list iters (min, med, max (stageId: taskId)):<br>(1.4, 1.4, 1.4 (stage 1.1: task 19))"];
}
3 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 291,629<br>shuffle write time total (min, med, max (stageId: taskId))<br>26 ms (0 ms, 0 ms, 26 ms (stage 0.1: task 16))<br>records read: 2,260,197<br>local bytes read total (min, med, max (stageId: taskId))<br>86.6 MiB (178.7 KiB, 522.3 KiB, 541.2 KiB (stage 1.1: task 204))<br>fetch wait time total (min, med, max (stageId: taskId))<br>3.7 s (0 ms, 0 ms, 461 ms (stage 1.1: task 147))<br>remote bytes read total (min, med, max (stageId: taskId))<br>52.1 MiB (176.0 KiB, 187.4 KiB, 538.8 KiB (stage 1.1: task 86))<br>local blocks read: 1,008<br>remote blocks read: 592<br>data size total (min, med, max (stageId: taskId))<br>24.5 MiB (0.0 B, 0.0 B, 24.5 MiB (stage 0.1: task 16))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>17.9 MiB (0.0 B, 0.0 B, 17.9 MiB (stage 0.1: task 16))"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n587 ms (0 ms, 0 ms, 587 ms (stage 0.1: task 16))";
5 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>450 ms (0 ms, 0 ms, 450 ms (stage 0.1: task 16))<br>peak memory total (min, med, max (stageId: taskId))<br>40.0 MiB (0.0 B, 0.0 B, 40.0 MiB (stage 0.1: task 16))<br>number of output rows: 291,629<br>avg hash probe bucket list iters: 1.6"];
6 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 291,682<br>number of input batches: 78"];
}
7 [labelType="html" label="<b>Scan parquet itv024694_lending_club.customers</b><br><br>number of files read: 200<br>scan time total (min, med, max (stageId: taskId))<br>297 ms (0 ms, 0 ms, 297 ms (stage 0.1: task 16))<br>metadata time: 2 ms<br>size of files read: 184.9 MiB<br>number of output rows: 291,682"];
2->0;
3->2;
5->3;
6->5;
7->6;
}
8
TakeOrderedAndProject(limit=21, orderBy=[total_count#0L DESC NULLS LAST], output=[member_id#2,total_count#39])
HashAggregate(keys=[member_id#2], functions=[count(1)])
WholeStageCodegen (2)
Exchange hashpartitioning(member_id#2, 200), ENSURE_REQUIREMENTS, [id=#25]
HashAggregate(keys=[member_id#2], functions=[partial_count(1)])
ColumnarToRow
WholeStageCodegen (1)
FileScan parquet itv024694_lending_club.customers[member_id#2] Batched: true, DataFilters: [], Format: Parquet, Location: InMemoryFileIndex[hdfs://m01.itversity.com:9000/public/trendytech/lendingclubproject/cleaned/cust..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<member_id:string>