<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Spark UI Replay Notebook in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132354#M49441</link>
    <description>&lt;P&gt;I need to load the Spark UI events of a long-running job.&lt;/P&gt;&lt;P&gt;I found this Databricks knowledge base article on the topic:&lt;BR /&gt;&lt;A href="https://kb.databricks.com/clusters/replay-cluster-spark-events" target="_blank"&gt;https://kb.databricks.com/clusters/replay-cluster-spark-events&lt;/A&gt;&lt;/P&gt;&lt;P&gt;However, the referenced notebook is no longer accessible.&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Does anyone still have a copy of that notebook?&lt;/LI&gt;&lt;LI&gt;Alternatively, is there a better way to increase the default replay limit in Databricks for a completed job?&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_0-1758177009088.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20072i9C5AAC451AC538CE/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_0-1758177009088.png" alt="der_0-1758177009088.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;resulting into:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_1-1758177084191.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20073i04FB0A5441870110/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_1-1758177084191.png" alt="der_1-1758177084191.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Thu, 18 Sep 2025 06:34:08 GMT</pubDate>
    <dc:creator>der</dc:creator>
    <dc:date>2025-09-18T06:34:08Z</dc:date>
    <item>
      <title>Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132354#M49441</link>
      <description>&lt;P&gt;I need to load the Spark UI events of a long-running job.&lt;/P&gt;&lt;P&gt;I found this Databricks knowledge base article on the topic:&lt;BR /&gt;&lt;A href="https://kb.databricks.com/clusters/replay-cluster-spark-events" target="_blank"&gt;https://kb.databricks.com/clusters/replay-cluster-spark-events&lt;/A&gt;&lt;/P&gt;&lt;P&gt;However, the referenced notebook is no longer accessible.&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Does anyone still have a copy of that notebook?&lt;/LI&gt;&lt;LI&gt;Alternatively, is there a better way to increase the default replay limit in Databricks for a completed job?&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_0-1758177009088.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20072i9C5AAC451AC538CE/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_0-1758177009088.png" alt="der_0-1758177009088.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;resulting into:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_1-1758177084191.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20073i04FB0A5441870110/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_1-1758177084191.png" alt="der_1-1758177084191.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 06:34:08 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132354#M49441</guid>
      <dc:creator>der</dc:creator>
      <dc:date>2025-09-18T06:34:08Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132362#M49443</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/154226"&gt;@der&lt;/a&gt;&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;Good day!!&lt;BR /&gt;&lt;BR /&gt;I see whole issue over here. As per the doc. the default size for&amp;nbsp;spark.ui.retainedJobs is 1000.&lt;/P&gt;&lt;P&gt;ref:&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Khaja_Zaffer_0-1758179161839.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20078iA3E8F59F8C78256B/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Khaja_Zaffer_0-1758179161839.png" alt="Khaja_Zaffer_0-1758179161839.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Can you increase them?&amp;nbsp;&lt;/P&gt;&lt;P&gt;For very large logs (e.g., 5600+ jobs), scale up further (e.g., to 100000 for retainedTasks/jobs) and use a cluster with more driver memory (e.g., via spark.driver.memory 16g)&lt;BR /&gt;&lt;BR /&gt;I am waiting for your response.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 07:07:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132362#M49443</guid>
      <dc:creator>Khaja_Zaffer</dc:creator>
      <dc:date>2025-09-18T07:07:46Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132374#M49446</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/173840"&gt;@Khaja_Zaffer&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;yes I set following values:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_2-1758181541962.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20085i72686FB5B782FAC8/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_2-1758181541962.png" alt="der_2-1758181541962.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;And the cluster should have also enough memory&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_1-1758181451689.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20084iBAB3A45FCEBA1343/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_1-1758181451689.png" alt="der_1-1758181451689.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Log is activated:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_3-1758181729042.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20086i9DBD6FD6275F1BB5/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_3-1758181729042.png" alt="der_3-1758181729042.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 07:49:21 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132374#M49446</guid>
      <dc:creator>der</dc:creator>
      <dc:date>2025-09-18T07:49:21Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132377#M49448</link>
      <description>&lt;P&gt;Okay, we can wait then. let me know if there any further issues&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:07:17 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132377#M49448</guid>
      <dc:creator>Khaja_Zaffer</dc:creator>
      <dc:date>2025-09-18T08:07:17Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132384#M49451</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/154226"&gt;@der&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;Here's the content of Event Log Replay notebook. You can use it to achieve your goals &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="szymon_dybczak_0-1758184107442.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20088i2F74D5181C446288/image-size/medium?v=v2&amp;amp;px=400" role="button" title="szymon_dybczak_0-1758184107442.png" alt="szymon_dybczak_0-1758184107442.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="java"&gt;%scala
dbutils.widgets.removeAll()
dbutils.widgets.text("event_log_path", "", "event_log_path")
 
val eventLogPath = dbutils.widgets.get("event_log_path")

package org.apache.spark.util
 
import org.apache.spark.scheduler.SparkListenerEvent
import org.json4s.JsonAST.JValue
 
/**
 * Visibility hack.
 */
object PublicJsonProtocol  {
  def sparkEventFromJson(json: JValue): SparkListenerEvent = {
    JsonProtocol.sparkEventFromJson(json)
  }
}


import java.util.zip.GZIPInputStream
import scala.collection.JavaConversions._
import org.json4s.jackson.JsonMethods._
import com.fasterxml.jackson.core.JsonParseException
import com.fasterxml.jackson.databind.exc.UnrecognizedPropertyException
 
import org.apache.commons.io.IOUtils
import org.apache.hadoop.fs._
import org.apache.spark.util.PublicJsonProtocol
 
 
/**
 * Function to replay all the events that happened on a cluster in the case the Spark History Server fails to
 * load the Spark UI. Run this command on an instance that hasn't run any Spark command to completely replay
 * all the events a cluser went through.
 */
def replaySparkEvents(pathToEventLogs: String): Unit = {
  val eventLogFiles = dbutils.fs.ls(pathToEventLogs).filter(_.name.startsWith("eventlog")).map(_.path)
  require(eventLogFiles.nonEmpty, "No event logs found at this path")
  val inOrder = eventLogFiles.tail ++ Seq(eventLogFiles.head)
  
  val lineIterator = inOrder.iterator.map { file =&amp;gt;
    val path = new Path(file)
    val fs = path.getFileSystem(spark.sessionState.newHadoopConf())
    val fileStream = fs.open(path)
    val stream = if (file.endsWith(".gz")) {
      new GZIPInputStream(fileStream)
    } else {
      fileStream
    }
    print("File process:"+file)
    val lines = IOUtils.readLines(stream)
    (stream, lines)
  }
  
  val lines = lineIterator.flatMap(_._2)
  val streams = lineIterator.map(_._1)
  
  val unrecognizedEvents = new scala.collection.mutable.HashSet[String]
  val unrecognizedProperties = new scala.collection.mutable.HashSet[String]
 
  val listenerBus = sc.listenerBus
  var currentLine: String = null
 
  try {
    while (lines.hasNext) {
      try {
        val entry = lines.next()
        currentLine = entry
        listenerBus.post(PublicJsonProtocol.sparkEventFromJson(parse(currentLine)))
      } catch {
        case e: java.lang.ClassNotFoundException =&amp;gt;
          // Ignore unknown events, parse through the event log file.
          // To avoid spamming, warnings are only displayed once for each unknown event.
          if (!unrecognizedEvents.contains(e.getMessage)) {
            println(s"Drop unrecognized event: ${e.getMessage}")
            unrecognizedEvents.add(e.getMessage)
          }
          println(s"Drop incompatible event log: $currentLine")
        case e: UnrecognizedPropertyException =&amp;gt;
          // Ignore unrecognized properties, parse through the event log file.
          // To avoid spamming, warnings are only displayed once for each unrecognized property.
          if (!unrecognizedProperties.contains(e.getMessage)) {
            println(s"Drop unrecognized property: ${e.getMessage}")
            unrecognizedProperties.add(e.getMessage)
          }
          println(s"Drop incompatible event log: $currentLine")
        case jpe: JsonParseException =&amp;gt;
          // We can only ignore exception from last line of the file that might be truncated
          // the last entry may not be the very last line in the event log, but we treat it
          // as such in a best effort to replay the given input
          if (lines.hasNext) {
            throw jpe
          } else {
            println(s"Got JsonParseException from log file. The file might not have finished writing cleanly.")
          }
      }
    }
  } finally {
    streams.foreach(IOUtils.closeQuietly)
  }
}

replaySparkEvents(eventLogPath)&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:28:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132384#M49451</guid>
      <dc:creator>szymon_dybczak</dc:creator>
      <dc:date>2025-09-18T08:28:36Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132386#M49453</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/110502"&gt;@szymon_dybczak&lt;/a&gt;&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;Do we have any documentation around this?&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:36:21 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132386#M49453</guid>
      <dc:creator>Khaja_Zaffer</dc:creator>
      <dc:date>2025-09-18T08:36:21Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132391#M49456</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/173840"&gt;@Khaja_Zaffer&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;Yes, we do -&amp;gt;&amp;nbsp;&lt;A href="https://kb.databricks.com/clusters/replay-cluster-spark-events" target="_blank" rel="noopener"&gt;Replay Apache Spark events in a cluster - Databricks&lt;/A&gt;&lt;/P&gt;&lt;P&gt;It's quite simple. You just need to provide a valid path to your cluster logs and run notebook content that I provided above. It should then replay events.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="szymon_dybczak_0-1758184889651.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20090i59D29008F7F37424/image-size/medium?v=v2&amp;amp;px=400" role="button" title="szymon_dybczak_0-1758184889651.png" alt="szymon_dybczak_0-1758184889651.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:42:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132391#M49456</guid>
      <dc:creator>szymon_dybczak</dc:creator>
      <dc:date>2025-09-18T08:42:18Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132393#M49457</link>
      <description>&lt;P&gt;The solution works as long as the cluster is running:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_0-1758184685442.png" style="width: 301px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20089i772B5BE4140B8D1E/image-dimensions/301x223?v=v2" width="301" height="223" role="button" title="der_0-1758184685442.png" alt="der_0-1758184685442.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;However, it does not replay all jobs if cluster is terminated (Example the job cluster from pipeline finished after hours)&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_1-1758184941528.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20091iE0DD85F936888B8A/image-size/medium?v=v2&amp;amp;px=400" role="button" title="der_1-1758184941528.png" alt="der_1-1758184941528.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;So how can we replay the full spark UI from a finished job cluster?&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:45:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132393#M49457</guid>
      <dc:creator>der</dc:creator>
      <dc:date>2025-09-18T08:45:02Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132394#M49458</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/110502"&gt;@szymon_dybczak&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I think he has some eventlog file.&amp;nbsp;&lt;/P&gt;&lt;P&gt;But Sorry for not asking properly.&amp;nbsp;&lt;BR /&gt;I mean the scala code? does it has any limitations or we can use it for such issues? I was actually looking for this code.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:46:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132394#M49458</guid>
      <dc:creator>Khaja_Zaffer</dc:creator>
      <dc:date>2025-09-18T08:46:49Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132396#M49459</link>
      <description>&lt;P&gt;Of course you can point it towards storage account:&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Khaja_Zaffer_0-1758185385429.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20092i90C030323C8D1B49/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Khaja_Zaffer_0-1758185385429.png" alt="Khaja_Zaffer_0-1758185385429.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Enable Spark event log delivery on your workspace/cluster (to DBFS, S3, ADLS, etc.). Otherwise you simply don’t have the logs to replay.&lt;/P&gt;&lt;P&gt;Check spark.eventLog.enabled true&lt;/P&gt;&lt;P&gt;Set spark.eventLog.dir to your persistent storage path.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 08:54:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132396#M49459</guid>
      <dc:creator>Khaja_Zaffer</dc:creator>
      <dc:date>2025-09-18T08:54:22Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132403#M49460</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/110502"&gt;@szymon_dybczak&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you for providing the content of the notebook. I haven't stored it and now it is not accessible anymore on Databricks Link (Homepage).&lt;/P&gt;&lt;P&gt;I think with this I can do it.&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 09:33:08 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132403#M49460</guid>
      <dc:creator>der</dc:creator>
      <dc:date>2025-09-18T09:33:08Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132405#M49461</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;No problem &lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/154226"&gt;@der&lt;/a&gt;&amp;nbsp;. If the provided answer was helpful please consider marking it as a solution to a thread.&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 09:39:47 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132405#M49461</guid>
      <dc:creator>szymon_dybczak</dc:creator>
      <dc:date>2025-09-18T09:39:47Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132410#M49464</link>
      <description>&lt;P&gt;Your notebook worked!&lt;/P&gt;&lt;P&gt;I only needed to change this cell:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="java"&gt;package org.apache.spark.util

import org.apache.spark.scheduler.SparkListenerEvent
import org.json4s.JsonAST.JValue
import org.json4s.jackson.JsonMethods

/**
 * Visibility hack.
 */
object PublicJsonProtocol  {
  def sparkEventFromJson(json: JValue): SparkListenerEvent = {
    JsonProtocol.sparkEventFromJson(JsonMethods.compact(json))
  }
}&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Spark UI output of an job compute (executed yesterday):&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="der_0-1758189521569.png" style="width: 280px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/20095iCA3531CB89BEC4E4/image-dimensions/280x222?v=v2" width="280" height="222" role="button" title="der_0-1758189521569.png" alt="der_0-1758189521569.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;you made my day&amp;nbsp;&lt;span class="lia-unicode-emoji" title=":hugging_face:"&gt;🤗&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 10:05:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132410#M49464</guid>
      <dc:creator>der</dc:creator>
      <dc:date>2025-09-18T10:05:34Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132412#M49466</link>
      <description>&lt;P&gt;Thats great!&lt;/P&gt;&lt;P&gt;congratulations&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/154226"&gt;@der&lt;/a&gt;&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/110502"&gt;@szymon_dybczak&lt;/a&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 10:08:32 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132412#M49466</guid>
      <dc:creator>Khaja_Zaffer</dc:creator>
      <dc:date>2025-09-18T10:08:32Z</dc:date>
    </item>
    <item>
      <title>Re: Spark UI Replay Notebook</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132413#M49467</link>
      <description>&lt;P&gt;So cool that it worked.&amp;nbsp;Good job guys&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/154226"&gt;@der&lt;/a&gt;&amp;nbsp;,&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/173840"&gt;@Khaja_Zaffer&lt;/a&gt;&amp;nbsp;!&lt;/P&gt;</description>
      <pubDate>Thu, 18 Sep 2025 10:12:05 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-ui-replay-notebook/m-p/132413#M49467</guid>
      <dc:creator>szymon_dybczak</dc:creator>
      <dc:date>2025-09-18T10:12:05Z</dc:date>
    </item>
  </channel>
</rss>

