<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Not able to get spark application in Spark History server using cluster eventlogs in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/not-able-to-get-spark-application-in-spark-history-server-using/m-p/83576#M36958</link>
    <description>&lt;P class=""&gt;I'm encountering an issue with incomplete Spark event logs. When I am running the local Spark History Server using the cluster logs, my application appears as "incomplete". Sometimes I also see a few queries listed as still running, even though the application has completed.&lt;/P&gt;&lt;P class=""&gt;&amp;nbsp;&lt;/P&gt;&lt;P class=""&gt;Are there any known issues/limitations&amp;nbsp;with event logging in the Databricks runtime that could cause this? Or is there any specific configuration I should check to ensure complete event logging?&lt;/P&gt;</description>
    <pubDate>Tue, 20 Aug 2024 09:44:26 GMT</pubDate>
    <dc:creator>ossoul</dc:creator>
    <dc:date>2024-08-20T09:44:26Z</dc:date>
    <item>
      <title>Not able to get spark application in Spark History server using cluster eventlogs</title>
      <link>https://community.databricks.com/t5/data-engineering/not-able-to-get-spark-application-in-spark-history-server-using/m-p/83576#M36958</link>
      <description>&lt;P class=""&gt;I'm encountering an issue with incomplete Spark event logs. When I am running the local Spark History Server using the cluster logs, my application appears as "incomplete". Sometimes I also see a few queries listed as still running, even though the application has completed.&lt;/P&gt;&lt;P class=""&gt;&amp;nbsp;&lt;/P&gt;&lt;P class=""&gt;Are there any known issues/limitations&amp;nbsp;with event logging in the Databricks runtime that could cause this? Or is there any specific configuration I should check to ensure complete event logging?&lt;/P&gt;</description>
      <pubDate>Tue, 20 Aug 2024 09:44:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/not-able-to-get-spark-application-in-spark-history-server-using/m-p/83576#M36958</guid>
      <dc:creator>ossoul</dc:creator>
      <dc:date>2024-08-20T09:44:26Z</dc:date>
    </item>
    <item>
      <title>Re: Not able to get spark application in Spark History server using cluster eventlogs</title>
      <link>https://community.databricks.com/t5/data-engineering/not-able-to-get-spark-application-in-spark-history-server-using/m-p/103344#M41413</link>
      <description>&lt;P&gt;Thanks for your question!&lt;/P&gt;
&lt;P&gt;I believe Databricks has its own SHS implementation, so it's not expected to work with the vanilla SHS. Regarding the queries marked as still running, we can also find this when there are event logs which were not properly closed, or the query failed midway leading to an incomplete/unclosed event.&lt;/P&gt;</description>
      <pubDate>Fri, 27 Dec 2024 18:33:50 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/not-able-to-get-spark-application-in-spark-history-server-using/m-p/103344#M41413</guid>
      <dc:creator>VZLA</dc:creator>
      <dc:date>2024-12-27T18:33:50Z</dc:date>
    </item>
  </channel>
</rss>

