<?xml version="1.0" encoding="UTF-8"?>
<!-- RSS 2.0 feed for a single Databricks Community thread (Data Engineering board); each post in the thread is one <item>. -->
<!-- Of the four prefixes declared on the root, only dc: is used by elements in this document; content:, rdf: and taxo: are declared but unreferenced. -->
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <!-- Channel metadata: link, description, pubDate, dc:creator and dc:date below carry the same values as the newest item in this feed (the reply, m-p/128336), not the opening question. -->
    <title>topic Re: how to manage a dynamic scheduled job if an INTERNAL_ERROR occurs? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-manage-a-dynamic-scheduled-job-if-an-internal-error/m-p/128336#M48210</link>
    <!-- The description holds HTML as entity-escaped text (no CDATA section); a consumer obtains the markup after one round of XML unescaping. -->
    <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/133094"&gt;@jeremy98&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;To investigate, check the Jobs UI for failed runs and review both error messages and cluster logs. Monitor failure trends over time and adjust cluster settings or quotas if needed.&lt;BR /&gt;&lt;A href="https://docs.databricks.com/gcp/en/jobs/repair-job-failures" target="_blank"&gt;https://docs.databricks.com/gcp/en/jobs/repair-job-failures&lt;/A&gt;&lt;/P&gt;&lt;P&gt;For detection, enable job notifications for “on failure” events in Job settings.&lt;BR /&gt;&lt;A href="https://docs.databricks.com/gcp/en/jobs/notifications" target="_blank"&gt;https://docs.databricks.com/gcp/en/jobs/notifications&lt;/A&gt;&lt;/P&gt;&lt;P&gt;For fallback, add a downstream task in the job configured to run only if failed.&lt;/P&gt;</description>
    <!-- pubDate (RFC 822 style) and dc:date (ISO 8601, UTC) express the same instant in two formats. -->
    <pubDate>Wed, 13 Aug 2025 12:20:23 GMT</pubDate>
    <dc:creator>SP_6721</dc:creator>
    <dc:date>2025-08-13T12:20:23Z</dc:date>
    <!-- Opening post of the thread (message m-p/128186) by jeremy98: the original question. -->
    <item>
      <title>how to manage a dynamic scheduled job if an INTERNAL_ERROR occurs?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-manage-a-dynamic-scheduled-job-if-an-internal-error/m-p/128186#M48170</link>
      <!-- Post body as entity-escaped HTML text; the wording is the author's and is feed payload. -->
      <description>&lt;P&gt;Hi community,&lt;/P&gt;&lt;P&gt;My team and I have been occasionally experiencing INTERNAL_ERROR events in Databricks. We have a job that runs on a schedule, but the start times vary. Sometimes, when the job is triggered, the underlying cluster fails to start for some reason.&lt;/P&gt;&lt;P&gt;I’d like some advice on how to better investigate these issues and how to set up a mitigation or fallback mechanism. Specifically, I want a way to detect when the job starts but the cluster cannot initialize, and then run an alternative process or alert.&lt;/P&gt;&lt;P&gt;Any suggestions or best practices would be greatly appreciated!&lt;/P&gt;</description>
      <pubDate>Tue, 12 Aug 2025 09:20:37 GMT</pubDate>
      <!-- guid repeats the link URL and has no isPermaLink attribute; RSS 2.0 defaults that attribute to true, so readers treat the guid as a permalink. -->
      <guid>https://community.databricks.com/t5/data-engineering/how-to-manage-a-dynamic-scheduled-job-if-an-internal-error/m-p/128186#M48170</guid>
      <dc:creator>jeremy98</dc:creator>
      <!-- Same instant as pubDate above, in ISO 8601 UTC form. -->
      <dc:date>2025-08-12T09:20:37Z</dc:date>
    </item>
    <!-- Reply in the same thread (message m-p/128336) by SP_6721; its link, description and dates are the values also used for the channel-level metadata. -->
    <item>
      <title>Re: how to manage a dynamic scheduled job if an INTERNAL_ERROR occurs?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-manage-a-dynamic-scheduled-job-if-an-internal-error/m-p/128336#M48210</link>
      <!-- Reply body as entity-escaped HTML text; it mentions the question author via a profile link and cites two Databricks docs URLs. -->
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/133094"&gt;@jeremy98&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;To investigate, check the Jobs UI for failed runs and review both error messages and cluster logs. Monitor failure trends over time and adjust cluster settings or quotas if needed.&lt;BR /&gt;&lt;A href="https://docs.databricks.com/gcp/en/jobs/repair-job-failures" target="_blank"&gt;https://docs.databricks.com/gcp/en/jobs/repair-job-failures&lt;/A&gt;&lt;/P&gt;&lt;P&gt;For detection, enable job notifications for “on failure” events in Job settings.&lt;BR /&gt;&lt;A href="https://docs.databricks.com/gcp/en/jobs/notifications" target="_blank"&gt;https://docs.databricks.com/gcp/en/jobs/notifications&lt;/A&gt;&lt;/P&gt;&lt;P&gt;For fallback, add a downstream task in the job configured to run only if failed.&lt;/P&gt;</description>
      <pubDate>Wed, 13 Aug 2025 12:20:23 GMT</pubDate>
      <!-- guid repeats the link URL and has no isPermaLink attribute; RSS 2.0 defaults that attribute to true, so readers treat the guid as a permalink. -->
      <guid>https://community.databricks.com/t5/data-engineering/how-to-manage-a-dynamic-scheduled-job-if-an-internal-error/m-p/128336#M48210</guid>
      <dc:creator>SP_6721</dc:creator>
      <!-- Same instant as pubDate above, in ISO 8601 UTC form. -->
      <dc:date>2025-08-13T12:20:23Z</dc:date>
    </item>
  </channel>
</rss>

