Show the Stage ID and Task ID that corresponds to the max metric
digraph G {
0 [labelType="html" label="<br><b>CollectLimit</b><br><br>"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (9)\n \nduration: total (min, med, max (stageId: taskId))\n441 ms (0 ms, 2 ms, 8 ms (stage 38.0: task 1170))";
2 [labelType="html" label="<br><b>Project</b><br><br>"];
3 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 22"];
4 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>302 ms (0 ms, 1 ms, 7 ms (stage 38.0: task 1170))<br>peak memory total (min, med, max (stageId: taskId))<br>9.7 GiB (256.0 KiB, 64.3 MiB, 64.3 MiB (stage 28.0: task 1099))<br>number of output rows: 323<br>avg hash probe bucket list iters (min, med, max (stageId: taskId)):<br>(1, 1, 1 (stage 28.0: task 1099))"];
}
5 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 8,528<br>shuffle write time total (min, med, max (stageId: taskId))<br>660 ms (0 ms, 3 ms, 11 ms (stage 22.0: task 952))<br>records read: 7,876<br>local bytes read total (min, med, max (stageId: taskId))<br>374.1 KiB (0.0 B, 1419.0 B, 7.4 KiB (stage 28.0: task 1098))<br>fetch wait time total (min, med, max (stageId: taskId))<br>52 ms (0 ms, 0 ms, 4 ms (stage 38.0: task 1146))<br>remote bytes read total (min, med, max (stageId: taskId))<br>312.9 KiB (0.0 B, 1502.0 B, 7.3 KiB (stage 38.0: task 1180))<br>local blocks read: 3,655<br>remote blocks read: 3,041<br>data size total (min, med, max (stageId: taskId))<br>523.5 KiB (0.0 B, 2.3 KiB, 7.3 KiB (stage 22.0: task 921))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>744.9 KiB (0.0 B, 3.4 KiB, 10.1 KiB (stage 22.0: task 921))"];
subgraph cluster6 {
isCluster="true";
label="WholeStageCodegen (8)\n \nduration: total (min, med, max (stageId: taskId))\n24.8 s (1 ms, 16 ms, 1.4 s (stage 22.0: task 995))";
7 [labelType="html" label="<b>HashAggregate</b><br><br>time in aggregation build total (min, med, max (stageId: taskId))<br>23.7 s (0 ms, 10 ms, 1.4 s (stage 22.0: task 995))<br>peak memory total (min, med, max (stageId: taskId))<br>50.0 MiB (256.0 KiB, 256.0 KiB, 256.0 KiB (stage 22.0: task 898))<br>number of output rows: 8,528"];
8 [labelType="html" label="<br><b>Project</b><br><br>"];
}
9 [labelType="html" label="<b>SortMergeJoin</b><br><br>number of output rows: 22,400,728"];
subgraph cluster10 {
isCluster="true";
label="WholeStageCodegen (5)\n \nduration: total (min, med, max (stageId: taskId))\n25.3 s (2 ms, 20 ms, 1.5 s (stage 22.0: task 995))";
11 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>137 ms (0 ms, 0 ms, 18 ms (stage 22.0: task 1008))<br>peak memory total (min, med, max (stageId: taskId))<br>10.8 GiB (64.0 KiB, 64.3 MiB, 256.0 MiB (stage 22.0: task 984))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 22.0: task 898))"];
}
12 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 22,400,728<br>shuffle write time total (min, med, max (stageId: taskId))<br>1.5 s (0 ms, 6 ms, 39 ms (stage 21.0: task 784))<br>records read: 22,400,728<br>local bytes read total (min, med, max (stageId: taskId))<br>188.0 MiB (0.0 B, 66.1 KiB, 11.3 MiB (stage 22.0: task 984))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 22.0: task 898))<br>remote bytes read total (min, med, max (stageId: taskId))<br>195.7 MiB (0.0 B, 76.4 KiB, 12.0 MiB (stage 22.0: task 984))<br>local blocks read: 8,849<br>remote blocks read: 8,445<br>data size total (min, med, max (stageId: taskId))<br>2.3 GiB (0.0 B, 152.6 KiB, 154.1 MiB (stage 21.0: task 784))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>383.7 MiB (0.0 B, 41.6 KiB, 24.5 MiB (stage 21.0: task 784))"];
subgraph cluster13 {
isCluster="true";
label="WholeStageCodegen (4)\n \nduration: total (min, med, max (stageId: taskId))\n23.4 s (0 ms, 10 ms, 1.6 s (stage 21.0: task 784))";
14 [labelType="html" label="<br><b>Project</b><br><br>"];
}
15 [labelType="html" label="<b>SortMergeJoin</b><br><br>number of output rows: 22,400,728"];
subgraph cluster16 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n24.3 s (2 ms, 13 ms, 1.6 s (stage 21.0: task 784))";
17 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>140 ms (0 ms, 0 ms, 21 ms (stage 21.0: task 784))<br>peak memory total (min, med, max (stageId: taskId))<br>11.0 GiB (64.0 KiB, 64.1 MiB, 256.0 MiB (stage 21.0: task 784))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 21.0: task 698))"];
}
18 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 22,400,728<br>shuffle write time total (min, med, max (stageId: taskId))<br>835 ms (25 ms, 42 ms, 51 ms (stage 20.0: task 689))<br>records read: 22,400,728<br>local bytes read total (min, med, max (stageId: taskId))<br>226.1 MiB (0.0 B, 16.4 KiB, 15.1 MiB (stage 21.0: task 795))<br>fetch wait time total (min, med, max (stageId: taskId))<br>5 ms (0 ms, 0 ms, 5 ms (stage 21.0: task 698))<br>remote bytes read total (min, med, max (stageId: taskId))<br>224.0 MiB (0.0 B, 17.6 KiB, 17.1 MiB (stage 21.0: task 784))<br>local blocks read: 1,435<br>remote blocks read: 1,414<br>data size total (min, med, max (stageId: taskId))<br>2.2 GiB (34.9 MiB, 126.4 MiB, 126.5 MiB (stage 20.0: task 679))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>450.1 MiB (7.3 MiB, 25.6 MiB, 25.6 MiB (stage 20.0: task 684))"];
19 [labelType="html" label="<b>Scan csv </b><br><br>number of files read: 7<br>metadata time: 0 ms<br>size of files read: 2.2 GiB<br>number of output rows: 22,400,728"];
subgraph cluster20 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: total (min, med, max (stageId: taskId))\n13.7 s (1 ms, 4 ms, 1.4 s (stage 21.0: task 784))";
21 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 21.0: task 698))<br>peak memory total (min, med, max (stageId: taskId))<br>9.1 GiB (64.0 KiB, 64.1 MiB, 64.1 MiB (stage 21.0: task 698))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 21.0: task 698))"];
}
22 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 265<br>shuffle write time total (min, med, max (stageId: taskId))<br>24 ms (11 ms, 12 ms, 12 ms (stage 19.0: task 676))<br>records read: 530<br>local bytes read total (min, med, max (stageId: taskId))<br>16.1 KiB (0.0 B, 72.0 B, 126.0 B (stage 22.0: task 998))<br>fetch wait time total (min, med, max (stageId: taskId))<br>894 ms (0 ms, 0 ms, 28 ms (stage 22.0: task 984))<br>remote bytes read total (min, med, max (stageId: taskId))<br>15.8 KiB (0.0 B, 0.0 B, 151.0 B (stage 21.0: task 721))<br>local blocks read: 203<br>remote blocks read: 195<br>data size total (min, med, max (stageId: taskId))<br>9.0 KiB (4.4 KiB, 4.6 KiB, 4.6 KiB (stage 19.0: task 675))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>16.0 KiB (7.8 KiB, 8.2 KiB, 8.2 KiB (stage 19.0: task 675))"];
subgraph cluster23 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n113 ms (55 ms, 58 ms, 58 ms (stage 19.0: task 676))";
24 [labelType="html" label="<br><b>Project</b><br><br>"];
25 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 265"];
26 [labelType="html" label="<b>Scan ExistingRDD</b><br><br>number of output rows: 265"];
}
subgraph cluster27 {
isCluster="true";
label="WholeStageCodegen (7)\n \nduration: total (min, med, max (stageId: taskId))\n14.7 s (0 ms, 12 ms, 1.1 s (stage 22.0: task 984))";
28 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 22.0: task 898))<br>peak memory total (min, med, max (stageId: taskId))<br>9.1 GiB (64.0 KiB, 64.1 MiB, 64.1 MiB (stage 22.0: task 898))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 22.0: task 898))"];
}
2->0;
3->2;
4->3;
5->4;
7->5;
8->7;
9->8;
11->9;
12->11;
14->12;
15->14;
17->15;
18->17;
19->18;
21->15;
22->21;
24->22;
25->24;
26->25;
28->9;
22->28;
}
29
CollectLimit 21
Project [cast(Month#405 as string) AS Month#604, route#383, cast(total_tip_amount#556 as string) AS total_tip_amount#606, cast(total_passenger_count#558 as string) AS total_passenger_count#607, cast(round((total_tip_amount#556 / total_passenger_count#558), 2) as string) AS average_tip_per_passenger#608]
HashAggregate(keys=[Month#405, route#383], functions=[partial_sum(cast(tip_amount#65 as double)), partial_sum(cast(passenger_count#57 as double))])
Project [passenger_count#57, tip_amount#65, concat_ws( to , Pickup_Borough#147, Borough#15) AS route#383, month(cast(tpep_pickup_datetime#55 as date)) AS Month#405]
WholeStageCodegen (8)
SortMergeJoin [cast(DOLocationID#60 as int)], [LocationID#14], LeftOuter
Sort [cast(DOLocationID#60 as int) ASC NULLS FIRST], false, 0
WholeStageCodegen (5)
Exchange hashpartitioning(cast(DOLocationID#60 as int), 200), true, [id=#403]
Project [tpep_pickup_datetime#55, passenger_count#57, DOLocationID#60, tip_amount#65, Borough#15 AS Pickup_Borough#147]
WholeStageCodegen (4)
SortMergeJoin [cast(PULocationID#59 as int)], [LocationID#14], LeftOuter
Sort [cast(PULocationID#59 as int) ASC NULLS FIRST], false, 0
WholeStageCodegen (1)
Exchange hashpartitioning(cast(PULocationID#59 as int), 200), true, [id=#370]