Show the Stage ID and Task ID that corresponds to the max metric
digraph G {
0 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 0<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 878.0: task 1263))<br>remote merged bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 878.0: task 1263))<br>remote merged blocks fetched: 0<br>records read: 0<br>local bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 878.0: task 1263))<br>remote bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))<br>merged fetch fallback count: 0<br>local blocks read: 0<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))<br>local merged bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))<br>number of partitions: 16<br>remote reqs duration total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 878.0: task 1263))<br>remote bytes read to disk total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 878.0: task 1263))"];
subgraph cluster1 {
isCluster="true";
label="WholeStageCodegen (6)\n \nduration: total (min, med, max (stageId: taskId))\n0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))";
2 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 0"];
}
3 [labelType="html" label="<b>SortAggregate</b><br><br>number of output rows: 2"];
subgraph cluster4 {
isCluster="true";
label="WholeStageCodegen (5)\n \nduration: total (min, med, max (stageId: taskId))\n8.9 s (126 ms, 168 ms, 258 ms (stage 820.0: task 1202))";
5 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>peak memory total (min, med, max (stageId: taskId))<br>7.1 MiB (64.0 KiB, 64.0 KiB, 2.1 MiB (stage 820.0: task 1202))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))"];
}
6 [labelType="html" label="<b>StateStoreSave</b><br><br>number of shuffle partitions: 50<br>number of removed state rows: 0<br>data returned from Python workers total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))<br>number of total state rows: 6<br>number of state store instances: 50<br>memory used by state total (min, med, max (stageId: taskId))<br>25.8 KiB (432.0 B, 432.0 B, 1296.0 B (stage 820.0: task 1217))<br>count of cache hit on states cache in provider: 700<br>number of output rows: 2<br>estimated size of state only on current version total (min, med, max (stageId: taskId))<br>9.6 KiB (104.0 B, 104.0 B, 936.0 B (stage 820.0: task 1217))<br>number of rows which are dropped by watermark: 0<br>data sent to Python workers total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))<br>count of cache miss on states cache in provider: 0<br>time to commit changes total (min, med, max (stageId: taskId))<br>8.5 s (97 ms, 163 ms, 253 ms (stage 820.0: task 1203))<br>time to remove total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>number of updated state rows: 2<br>time to update total (min, med, max (stageId: taskId))<br>289 ms (0 ms, 1 ms, 151 ms (stage 820.0: task 1202))<br>number of output rows: 0"];
7 [labelType="html" label="<b>SortAggregate</b><br><br>number of output rows: 2"];
subgraph cluster8 {
isCluster="true";
label="WholeStageCodegen (4)\n \nduration: total (min, med, max (stageId: taskId))\n177 ms (0 ms, 1 ms, 81 ms (stage 820.0: task 1208))";
9 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>peak memory total (min, med, max (stageId: taskId))<br>7.1 MiB (64.0 KiB, 64.0 KiB, 2.1 MiB (stage 820.0: task 1202))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))"];
}
10 [labelType="html" label="<b>StateStoreRestore</b><br><br>number of output rows: 2"];
11 [labelType="html" label="<b>SortAggregate</b><br><br>number of output rows: 2"];
subgraph cluster12 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: total (min, med, max (stageId: taskId))\n107 ms (0 ms, 1 ms, 22 ms (stage 820.0: task 1212))";
13 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>peak memory total (min, med, max (stageId: taskId))<br>7.1 MiB (64.0 KiB, 64.0 KiB, 2.1 MiB (stage 820.0: task 1202))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))"];
}
14 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 2<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>3 ms (0 ms, 0 ms, 1 ms (stage 819.0: task 1141))<br>remote merged bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>remote merged blocks fetched: 0<br>records read: 2<br>local bytes read total (min, med, max (stageId: taskId))<br>509.0 B (0.0 B, 0.0 B, 272.0 B (stage 820.0: task 1202))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>remote bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))<br>merged fetch fallback count: 0<br>local blocks read: 2<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>1272.0 B (0.0 B, 0.0 B, 656.0 B (stage 819.0: task 1142))<br>local merged bytes read total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))<br>number of partitions: 50<br>remote reqs duration total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>remote bytes read to disk total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>509.0 B (0.0 B, 0.0 B, 272.0 B (stage 819.0: task 1142))"];
15 [labelType="html" label="<b>SortAggregate</b><br><br>number of output rows: 2"];
subgraph cluster16 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n1.1 s (0 ms, 0 ms, 560 ms (stage 819.0: task 1142))";
17 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 820.0: task 1197))<br>peak memory total (min, med, max (stageId: taskId))<br>4.1 MiB (0.0 B, 0.0 B, 2.1 MiB (stage 819.0: task 1141))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 820.0: task 1197))"];
18 [labelType="html" label="<br><b>Project</b><br><br>"];
}
19 [labelType="html" label="<br><b>EventTimeWatermark</b><br><br>"];
subgraph cluster20 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: total (min, med, max (stageId: taskId))\n1.1 s (0 ms, 0 ms, 534 ms (stage 819.0: task 1142))";
21 [labelType="html" label="<br><b>Project</b><br><br>"];
}
22 [labelType="html" label="<br><b>Project</b><br><br>"];
23 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 2"];
24 [labelType="html" label="<b>MicroBatchScan</b><br><br>number of output rows: 2<br>estimated number of fetched offsets out of range: 0<br>number of data loss error: 0"];
2->0;
3->2;
5->3;
6->5;
7->6;
9->7;
10->9;
11->10;
13->11;
14->13;
15->14;
17->15;
18->17;
19->18;
21->19;
22->21;
23->22;
24->23;
}
Project [data#23.title AS title#28, data#23.url AS url#29, data#23.uuid AS uuid#30, data#23.inventory_code AS inventory_code#32, data#23.created_at AS created_at#33, data#23.date AS date#41]
Filter ((((((isnotnull(value#8) AND NOT (RLIKE(from_json(StructField(agent,StringType,true), cast(value#8 as string), Some(Etc/UTC)).agent, Yeti|compatible|googlebot|google\.com\/bot\.html) <=> true)) AND (cast(from_json(StructField(date,StringType,true), cast(value#8 as string), Some(Etc/UTC)).date as date) = cast(from_utc_timestamp(2025-12-05 23:50:00.034, Asia/Seoul) as date))) AND (from_json(StructField(ad_type,StringType,true), cast(value#8 as string), Some(Etc/UTC)).ad_type = request)) AND isnotnull(from_json(StructField(title,StringType,true), cast(value#8 as string), Some(Etc/UTC)).title)) AND NOT (from_json(StructField(title,StringType,true), cast(value#8 as string), Some(Etc/UTC)).title = )) AND isnotnull(from_json(StructField(url,StringType,true), cast(value#8 as string), Some(Etc/UTC)).url))
MicroBatchScan[key#7, value#8, topic#9, partition#10, offset#11L, timestamp#12, timestampType#13] class org.apache.spark.sql.kafka010.KafkaSourceProvider$KafkaScan