digraph G {
0 [labelType="html" label="<br><b>TakeOrderedAndProject</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (5)\n \nduration: total (min, med, max (stageId: taskId))\n1.2 s (0 ms, 0 ms, 132 ms (stage 2149.0: task 3492))";
2 [labelType="html" label="<br><b>Project</b><br><br>"];
3 [labelType="html" label="<b>SortMergeJoin</b><br><br>number of output rows: 265"];
}
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n2.3 s (0 ms, 2 ms, 152 ms (stage 2149.0: task 3485))";
5 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 2149.0: task 3469))<br>peak memory total (min, med, max (stageId: taskId))<br>2.3 GiB (64.0 KiB, 16.1 MiB, 16.1 MiB (stage 2149.0: task 3469))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 2149.0: task 3469))"];
}
6 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 265<br>shuffle write time total (min, med, max (stageId: taskId))<br>176 ms (7 ms, 11 ms, 13 ms (stage 2148.0: task 3457))<br>records read: 265<br>local bytes read total (min, med, max (stageId: taskId))<br>26.8 KiB (0.0 B, 137.0 B, 418.0 B (stage 2149.0: task 3519))<br>fetch wait time total (min, med, max (stageId: taskId))<br>280 ms (0 ms, 0 ms, 65 ms (stage 2149.0: task 3499))<br>remote bytes read total (min, med, max (stageId: taskId))<br>8.3 KiB (0.0 B, 0.0 B, 351.0 B (stage 2149.0: task 3519))<br>local blocks read: 196<br>remote blocks read: 60<br>data size total (min, med, max (stageId: taskId))<br>28.4 KiB (1680.0 B, 1760.0 B, 2.7 KiB (stage 2148.0: task 3467))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>35.1 KiB (2.0 KiB, 2.1 KiB, 3.2 KiB (stage 2148.0: task 3467))"];
subgraph cluster7 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n831 ms (49 ms, 51 ms, 57 ms (stage 2148.0: task 3458))";
8 [labelType="html" label="<br><b>Project</b><br><br>"];
9 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 265"];
10 [labelType="html" label="<b>Scan ExistingRDD</b><br><br>number of output rows: 265"];
}
subgraph cluster11 {
isCluster="true";
label="WholeStageCodegen (4)\n \nduration: total (min, med, max (stageId: taskId))\n885 ms (0 ms, 0 ms, 67 ms (stage 2149.0: task 3494))";
12 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 2149.0: task 3469))<br>peak memory total (min, med, max (stageId: taskId))<br>2.3 GiB (0.0 B, 16.1 MiB, 16.1 MiB (stage 2149.0: task 3469))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 2149.0: task 3469))"];
}
13 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 265<br>shuffle write time total (min, med, max (stageId: taskId))<br>156 ms (5 ms, 10 ms, 10 ms (stage 2147.0: task 3443))<br>records read: 265<br>local bytes read total (min, med, max (stageId: taskId))<br>8.8 KiB (0.0 B, 0.0 B, 241.0 B (stage 2149.0: task 3519))<br>fetch wait time total (min, med, max (stageId: taskId))<br>269 ms (0 ms, 0 ms, 66 ms (stage 2149.0: task 3494))<br>remote bytes read total (min, med, max (stageId: taskId))<br>9.7 KiB (0.0 B, 74.0 B, 222.0 B (stage 2149.0: task 3473))<br>local blocks read: 119<br>remote blocks read: 133<br>data size total (min, med, max (stageId: taskId))<br>10.4 KiB (640.0 B, 680.0 B, 680.0 B (stage 2147.0: task 3445))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>18.4 KiB (1070.0 B, 1196.0 B, 1259.0 B (stage 2147.0: task 3441))"];
subgraph cluster14 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: total (min, med, max (stageId: taskId))\n216 ms (10 ms, 13 ms, 17 ms (stage 2147.0: task 3439))";
15 [labelType="html" label="<br><b>Project</b><br><br>"];
16 [labelType="html" label="<br><b>SerializeFromObject</b><br><br>"];
}
17 [labelType="html" label="<b>Scan</b><br><br>number of output rows: 265"];
2->0;
3->2;
5->3;
6->5;
8->6;
9->8;
10->9;
12->3;
13->12;
15->13;
16->15;
17->16;
}
18
TakeOrderedAndProject(limit=6, orderBy=[pagerank#461 DESC NULLS LAST], output=[id#513,pagerank#514])
Project [attr#323.id AS id#457, graphx_attr#424.pagerank AS pagerank#461]
SortMergeJoin [new_id#325L], [new_id#419L], Inner
WholeStageCodegen (5)
Sort [new_id#325L ASC NULLS FIRST], false, 0
WholeStageCodegen (2)
Exchange hashpartitioning(new_id#325L, 200), true, [id=#497]
Project [cast(id#105 as bigint) AS new_id#325L, struct(id, id#105, Borough, Borough#106, Zone, Zone#107, service_zone, service_zone#108) AS attr#323]
Filter isnotnull(cast(id#105 as bigint))
Scan ExistingRDD[id#105,Borough#106,Zone#107,service_zone#108]
WholeStageCodegen (1)
Sort [new_id#419L ASC NULLS FIRST], false, 0
WholeStageCodegen (4)
Exchange hashpartitioning(new_id#419L, 200), true, [id=#506]
Project [struct(pagerank, _2#416._1) AS graphx_attr#424, _1#415L AS new_id#419L]
SerializeFromObject [knownnotnull(assertnotnull(input[0, scala.Tuple2, true]))._1 AS _1#415L, if (isnull(knownnotnull(assertnotnull(input[0, scala.Tuple2, true]))._2)) null else named_struct(_1, knownnotnull(knownnotnull(assertnotnull(input[0, scala.Tuple2, true]))._2)._1) AS _2#416]
WholeStageCodegen (3)
Scan[obj#414]