<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic AutoLoader - process multiple files in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/autoloader-process-multiple-files/m-p/16998#M11079</link>
    <description>&lt;P&gt;I need to process files with different schemas arriving in different folders in ADLS using Autoloader. Do I need to start a separate read stream for each file type / folder, or can this be handled using a single stream?&lt;/P&gt;&lt;P&gt;When I tried using a single stream, multiple files get clubbed into the same read and it's quite difficult to process the files as the schema is different.&lt;/P&gt;</description>
    <pubDate>Tue, 13 Dec 2022 15:27:13 GMT</pubDate>
    <dc:creator>avenu</dc:creator>
    <dc:date>2022-12-13T15:27:13Z</dc:date>
    <item>
      <title>AutoLoader - process multiple files</title>
      <link>https://community.databricks.com/t5/data-engineering/autoloader-process-multiple-files/m-p/16998#M11079</link>
      <description>&lt;P&gt;I need to process files with different schemas arriving in different folders in ADLS using Autoloader. Do I need to start a separate read stream for each file type / folder, or can this be handled using a single stream?&lt;/P&gt;&lt;P&gt;When I tried using a single stream, multiple files get clubbed into the same read and it's quite difficult to process the files as the schema is different.&lt;/P&gt;</description>
      <pubDate>Tue, 13 Dec 2022 15:27:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/autoloader-process-multiple-files/m-p/16998#M11079</guid>
      <dc:creator>avenu</dc:creator>
      <dc:date>2022-12-13T15:27:13Z</dc:date>
    </item>
    <item>
      <title>Re: AutoLoader - process multiple files</title>
      <link>https://community.databricks.com/t5/data-engineering/autoloader-process-multiple-files/m-p/16999#M11080</link>
      <description>&lt;P&gt;As you are talking about different schemas, perhaps schemaEvolutionMode, inferColumnTypes, or schemaHints may help? Check out this video, from 32 min onward: &lt;A href="https://youtu.be/8a38Fv9cpd8" alt="https://youtu.be/8a38Fv9cpd8" target="_blank"&gt;https://youtu.be/8a38Fv9cpd8&lt;/A&gt; &lt;/P&gt;&lt;P&gt;&#8203;&lt;/P&gt;&lt;P&gt;Hope it helps; do let us know how you solve it if you can.&#8203;&lt;/P&gt;</description>
      <pubDate>Thu, 15 Dec 2022 14:50:42 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/autoloader-process-multiple-files/m-p/16999#M11080</guid>
      <dc:creator>Wassim</dc:creator>
      <dc:date>2022-12-15T14:50:42Z</dc:date>
    </item>
  </channel>
</rss>

