<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Autoloader - File Notification mode in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/autoloader-file-notification-mode/m-p/64051#M32447</link>
    <description>&lt;P&gt;Hi All,&lt;/P&gt;&lt;P&gt;I have set up a DLT pipeline that is using Autoloader in a file notification mode.&lt;/P&gt;&lt;P&gt;Everything runs smoothly for the first time. However, it seems like the next micro-batch did not trigger as I can see some events coming in the queue.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_0-1710827649089.png" style="width: 1596px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6694iCBAE8420C3E708AF/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_0-1710827649089.png" alt="Gilg_0-1710827649089.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;But if I look at SparkUI I do not see any active jobs for a while now.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_1-1710827662118.png" style="width: 377px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6695iCE0EE89D1BB3059F/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_1-1710827662118.png" alt="Gilg_1-1710827662118.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Not sure what is happening here.&lt;/P&gt;&lt;P&gt;Cheers,&lt;/P&gt;&lt;P&gt;Gil&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Tue, 19 Mar 2024 05:56:39 GMT</pubDate>
    <dc:creator>Gilg</dc:creator>
    <dc:date>2024-03-19T05:56:39Z</dc:date>
    <item>
      <title>Autoloader - File Notification mode</title>
      <link>https://community.databricks.com/t5/data-engineering/autoloader-file-notification-mode/m-p/64051#M32447</link>
      <description>&lt;P&gt;Hi All,&lt;/P&gt;&lt;P&gt;I have set up a DLT pipeline that is using Autoloader in a file notification mode.&lt;/P&gt;&lt;P&gt;Everything runs smoothly for the first time. However, it seems like the next micro-batch did not trigger as I can see some events coming in the queue.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_0-1710827649089.png" style="width: 1596px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6694iCBAE8420C3E708AF/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_0-1710827649089.png" alt="Gilg_0-1710827649089.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;But if I look at SparkUI I do not see any active jobs for a while now.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_1-1710827662118.png" style="width: 377px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6695iCE0EE89D1BB3059F/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_1-1710827662118.png" alt="Gilg_1-1710827662118.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Not sure what is happening here.&lt;/P&gt;&lt;P&gt;Cheers,&lt;/P&gt;&lt;P&gt;Gil&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 19 Mar 2024 05:56:39 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/autoloader-file-notification-mode/m-p/64051#M32447</guid>
      <dc:creator>Gilg</dc:creator>
      <dc:date>2024-03-19T05:56:39Z</dc:date>
    </item>
    <item>
      <title>Re: Autoloader - File Notification mode</title>
      <link>https://community.databricks.com/t5/data-engineering/autoloader-file-notification-mode/m-p/64127#M32473</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I did some digging on the messages that we are receiving.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;By default, autoloader generates the Event Grid System Topic, Event Subscriptions and Storage Queue endpoint.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_0-1710897237186.png" style="width: 1353px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6704i57748F4DCAFE4CC1/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_0-1710897237186.png" alt="Gilg_0-1710897237186.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_6-1710897546457.png" style="width: 1351px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6710i98A504CE82A8300A/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_6-1710897546457.png" alt="Gilg_6-1710897546457.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Looking at the queue endpoint it has a filter that is set automatically below.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_2-1710897252022.png" style="width: 777px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6706iE267BE258123F6DE/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_2-1710897252022.png" alt="Gilg_2-1710897252022.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;In our test we have removed this filter and see what messages we are getting.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;We’ve noticed that messages that we are receiving in the Storage Queue only have a tag of “CreateFile”.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_7-1710897593599.png" style="width: 1305px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6711i4FF5B0B270DEC926/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_7-1710897593599.png" alt="Gilg_7-1710897593599.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;But autoloader seems to be listening to different api tags according to this below.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Gilg_4-1710897271297.png" style="width: 861px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6707i796931EC12DAD2CD/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Gilg_4-1710897271297.png" alt="Gilg_4-1710897271297.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I think that it could be the reason why we do not get any Active jobs in SparkUI because Autoloader is looking to different api tags to process.&lt;/P&gt;&lt;P&gt;Not sure why this is happening.&lt;/P&gt;</description>
      <pubDate>Wed, 20 Mar 2024 01:20:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/autoloader-file-notification-mode/m-p/64127#M32473</guid>
      <dc:creator>Gilg</dc:creator>
      <dc:date>2024-03-20T01:20:22Z</dc:date>
    </item>
  </channel>
</rss>

