<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Autoloader file latency in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58724#M2368</link>
    <description>&lt;P&gt;Hi Team,&lt;/P&gt;&lt;P&gt;I would like to understand if there is a metadata table for the autoloader in Databricks that captures information about file arrival and processing.&lt;/P&gt;&lt;P&gt;We are experiencing data issues because our table A receives hundreds of files that are processed by an autoloader,&lt;BR /&gt;and in some scenarios, we have noticed that old files are processed after new files, possibly due to a problem in the source system.&lt;BR /&gt;However, if we have clear details about autoloader metadata, it will be easier to identify the root cause.&lt;/P&gt;&lt;P&gt;Could you please share the best practices for organizing data in a storage location that an autoloader can effectively process?&lt;/P&gt;</description>
    <pubDate>Tue, 30 Jan 2024 16:27:41 GMT</pubDate>
    <dc:creator>Phani1</dc:creator>
    <dc:date>2024-01-30T16:27:41Z</dc:date>
    <item>
      <title>Autoloader file latency</title>
      <link>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58724#M2368</link>
      <description>&lt;P&gt;Hi Team,&lt;/P&gt;&lt;P&gt;I would like to understand if there is a metadata table for the autoloader in Databricks that captures information about file arrival and processing.&lt;/P&gt;&lt;P&gt;We are experiencing data issues because our table A receives hundreds of files that are processed by an autoloader,&lt;BR /&gt;and in some scenarios, we have noticed that old files are processed after new files, possibly due to a problem in the source system.&lt;BR /&gt;However, if we have clear details about autoloader metadata, it will be easier to identify the root cause.&lt;/P&gt;&lt;P&gt;Could you please share the best practices for organizing data in a storage location that an autoloader can effectively process?&lt;/P&gt;</description>
      <pubDate>Tue, 30 Jan 2024 16:27:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58724#M2368</guid>
      <dc:creator>Phani1</dc:creator>
      <dc:date>2024-01-30T16:27:41Z</dc:date>
    </item>
    <item>
      <title>Re: Autoloader file latency</title>
      <link>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58764#M2371</link>
      <description>&lt;P&gt;Are you using file listing or file notification for auto loader?&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 00:06:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58764#M2371</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2024-01-31T00:06:13Z</dc:date>
    </item>
    <item>
      <title>Re: Autoloader file latency</title>
      <link>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58781#M2373</link>
      <description>&lt;P&gt;We are using the default.&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 04:58:29 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58781#M2373</guid>
      <dc:creator>Phani1</dc:creator>
      <dc:date>2024-01-31T04:58:29Z</dc:date>
    </item>
    <item>
      <title>Re: Autoloader file latency</title>
      <link>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58885#M2376</link>
      <description>&lt;P&gt;Check with&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;SPAN class="n"&gt;cloud_files_state&lt;/SPAN&gt;&lt;SPAN class="p"&gt;(&lt;/SPAN&gt;&lt;SPAN class="p"&gt;) API&lt;/SPAN&gt;&lt;/PRE&gt;
&lt;P&gt;You can find examples here&amp;nbsp;&lt;A href="https://docs.databricks.com/en/ingestion/auto-loader/production.html#querying-files-discovered-by-auto-loader" target="_blank"&gt;https://docs.databricks.com/en/ingestion/auto-loader/production.html#querying-files-discovered-by-auto-loader&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 31 Jan 2024 19:10:53 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/autoloader-file-latency/m-p/58885#M2376</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2024-01-31T19:10:53Z</dc:date>
    </item>
  </channel>
</rss>

