digraph G {
0 [labelType="html" label="<br><b>TakeOrderedAndProject</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n92 ms (0 ms, 0 ms, 16 ms (stage 19.0: task 1024))";
2 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>2 ms (0 ms, 0 ms, 1 ms (stage 19.0: task 1024))<br>peak memory total (min, med, max (stageId: taskId))<br>3.2 GiB (16.3 MiB, 16.3 MiB, 16.3 MiB (stage 19.0: task 1014))<br>number of output rows: 5,655<br>avg hash probe bucket list iters (min, med, max (stageId: taskId)):<br>(1, 1, 1 (stage 19.0: task 1014))"];
}
3 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 5,655<br>shuffle write time: 11 ms<br>records read: 5,655<br>local bytes read total (min, med, max (stageId: taskId))<br>59.5 KiB (174.0 B, 302.0 B, 423.0 B (stage 19.0: task 1044))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 19.0: task 1014))<br>local blocks read: 200<br>data size: 132.5 KiB<br>shuffle bytes written: 59.5 KiB"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: 190 ms";
5 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build: 128 ms<br>peak memory: 256.0 KiB<br>number of output rows: 5,655"];
6 [labelType="html" label="<br><b>Project</b><br><br>"];
7 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 7,556"];
}
8 [labelType="html" label="<b>Scan csv </b><br><br>number of output rows: 7,556<br>number of files read: 1<br>metadata time: 0 ms<br>size of files read: 2.9 MiB"];
2->0;
3->2;
5->3;
6->5;
7->6;
8->7;
}
9
TakeOrderedAndProject(limit=21, orderBy=[count#133L DESC NULLS LAST], output=[customer_id#138,count#139])
HashAggregate(keys=[customer_id#18], functions=[count(1)])
WholeStageCodegen (2)
Exchange hashpartitioning(customer_id#18, 200), ENSURE_REQUIREMENTS, [id=#227]
HashAggregate(keys=[customer_id#18], functions=[partial_count(1)])
Project [customer_id#18]
Filter (isnotnull(order_status#19) AND (order_status#19 = CLOSED))
WholeStageCodegen (1)
FileScan csv [customer_id#18,order_status#19] Batched: false, DataFilters: [isnotnull(order_status#19), (order_status#19 = CLOSED)], Format: CSV, Location: InMemoryFileIndex[hdfs://m01.itversity.com:9000/public/trendytech/orders_wh/orders_wh.csv], PartitionFilters: [], PushedFilters: [IsNotNull(order_status), EqualTo(order_status,CLOSED)], ReadSchema: struct<customer_id:int,order_status:string>