<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Create external table using multiple paths/locations in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/82041#M36493</link>
    <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;, hope you are well.&lt;BR /&gt;&lt;BR /&gt;This is still not working for me.&lt;BR /&gt;&lt;BR /&gt;For example:&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Full path works fine:&amp;nbsp;&lt;UL&gt;&lt;LI&gt;&lt;SPAN&gt;abfss://&amp;lt;container&amp;gt;@&amp;lt;storage_account&amp;gt;.dfs.core.windows.net/automation/&amp;lt;subfolder1&amp;gt;/&amp;lt;subfolder2&amp;gt;/&amp;lt;subfolder3&amp;gt;/part_0_0001.csv&lt;/SPAN&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;DIV&gt;&lt;UL&gt;&lt;LI&gt;&lt;SPAN&gt;But as soon as a use wildcard, any of below options fail:&lt;/SPAN&gt;&lt;UL&gt;&lt;LI&gt;&lt;SPAN&gt;abfss://&amp;lt;container&amp;gt;@&amp;lt;storage_account&amp;gt;.dfs.core.windows.net/automation/&amp;lt;subfolder1&amp;gt;/&amp;lt;subfolder2&amp;gt;/&amp;lt;subfolder3&amp;gt;/*.csv&amp;nbsp; (on File name)&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;abfss://&amp;lt;container&amp;gt;@&amp;lt;storage_account&amp;gt;.dfs.core.windows.net/automation/&amp;lt;subfolder1&amp;gt;/&amp;lt;subfolder2&amp;gt;/*/part_00001.csv (on Subfolder)&lt;/SPAN&gt;&lt;SPAN&gt;&lt;BR /&gt;&lt;/SPAN&gt;&lt;SPAN&gt;ERROR:&lt;BR /&gt;&lt;/SPAN&gt;&lt;SPAN&gt;Failure to initialize configuration for storage account &amp;lt;storage_account&amp;gt;.dfs.core.windows.net: Invalid configuration value detected for fs.azure.account.key&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;My table settings are:&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;USING&lt;/SPAN&gt;&lt;SPAN&gt; csv&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;OPTIONS&lt;/SPAN&gt; &lt;SPAN&gt;(&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'DATEFORMAT'&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; 
&lt;SPAN&gt;'MM/dd/yyyy'&lt;/SPAN&gt;&lt;SPAN&gt;,&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'ESCAPE'&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; &lt;SPAN&gt;'"'&lt;/SPAN&gt;&lt;SPAN&gt;,&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'HEADER'&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; &lt;SPAN&gt;'true'&lt;/SPAN&gt;&lt;SPAN&gt;)&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;Any suggestions?&lt;/DIV&gt;&lt;DIV&gt;Emiliano&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="full_path.png" style="width: 999px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/10157i38B6517A0BF3A9F2/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999" role="button" title="full_path.png" alt="full_path.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="wildcard.png" style="width: 999px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/10158i198CF6C9F9F059BA/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999" role="button" title="wildcard.png" alt="wildcard.png" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
    <pubDate>Tue, 06 Aug 2024 13:29:31 GMT</pubDate>
    <dc:creator>ellerado</dc:creator>
    <dc:date>2024-08-06T13:29:31Z</dc:date>
    <item>
      <title>Create external table using multiple paths/locations</title>
      <link>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/44042#M27595</link>
      <description>&lt;P&gt;I want to create an external table from more than a single path. I have configured my storage creds and added an external location, and I can successfully create a table using the following code;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;create table test.base.Example
using csv
options ( 
  header = "true"
) 
location 'abfss://test@exampleblob.dfs.core.windows.net/2022/08/data/'&lt;/LI-CODE&gt;&lt;P&gt;But I have lots of data partitioned by month and date, so I'm wondering if there is any way to import data from multiple paths using wildcards or something similar, as outlined in the code below?&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;create table test.base.Example
using csv
options ( 
  header = "true"
) 
location 'abfss://test@exampleblob.dfs.core.windows.net/*/*/data/'&lt;/LI-CODE&gt;&lt;P&gt;Many thanks&lt;/P&gt;&lt;P&gt;Tim&lt;/P&gt;</description>
      <pubDate>Thu, 07 Sep 2023 21:30:58 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/44042#M27595</guid>
      <dc:creator>TimB</dc:creator>
      <dc:date>2023-09-07T21:30:58Z</dc:date>
    </item>
    <item>
      <title>Re: Create external table using multiple paths/locations</title>
      <link>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/82041#M36493</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;, hope you are well.&lt;BR /&gt;&lt;BR /&gt;This is still not working for me.&lt;BR /&gt;&lt;BR /&gt;For example:&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Full path works fine:&amp;nbsp;&lt;UL&gt;&lt;LI&gt;&lt;SPAN&gt;abfss://&amp;lt;container&amp;gt;@&amp;lt;storage_account&amp;gt;.dfs.core.windows.net/automation/&amp;lt;subfolder1&amp;gt;/&amp;lt;subfolder2&amp;gt;/&amp;lt;subfolder3&amp;gt;/part_0_0001.csv&lt;/SPAN&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;DIV&gt;&lt;UL&gt;&lt;LI&gt;&lt;SPAN&gt;But as soon as a use wildcard, any of below options fail:&lt;/SPAN&gt;&lt;UL&gt;&lt;LI&gt;&lt;SPAN&gt;abfss://&amp;lt;container&amp;gt;@&amp;lt;storage_account&amp;gt;.dfs.core.windows.net/automation/&amp;lt;subfolder1&amp;gt;/&amp;lt;subfolder2&amp;gt;/&amp;lt;subfolder3&amp;gt;/*.csv&amp;nbsp; (on File name)&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;abfss://&amp;lt;container&amp;gt;@&amp;lt;storage_account&amp;gt;.dfs.core.windows.net/automation/&amp;lt;subfolder1&amp;gt;/&amp;lt;subfolder2&amp;gt;/*/part_00001.csv (on Subfolder)&lt;/SPAN&gt;&lt;SPAN&gt;&lt;BR /&gt;&lt;/SPAN&gt;&lt;SPAN&gt;ERROR:&lt;BR /&gt;&lt;/SPAN&gt;&lt;SPAN&gt;Failure to initialize configuration for storage account &amp;lt;storage_account&amp;gt;.dfs.core.windows.net: Invalid configuration value detected for fs.azure.account.key&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;My table settings are:&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;USING&lt;/SPAN&gt;&lt;SPAN&gt; csv&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;OPTIONS&lt;/SPAN&gt; &lt;SPAN&gt;(&lt;/SPAN&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'DATEFORMAT'&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; 
&lt;SPAN&gt;'MM/dd/yyyy'&lt;/SPAN&gt;&lt;SPAN&gt;,&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'ESCAPE'&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; &lt;SPAN&gt;'"'&lt;/SPAN&gt;&lt;SPAN&gt;,&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'HEADER'&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; &lt;SPAN&gt;'true'&lt;/SPAN&gt;&lt;SPAN&gt;)&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;Any suggestions?&lt;/DIV&gt;&lt;DIV&gt;Emiliano&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="full_path.png" style="width: 999px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/10157i38B6517A0BF3A9F2/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999" role="button" title="full_path.png" alt="full_path.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="wildcard.png" style="width: 999px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/10158i198CF6C9F9F059BA/image-size/large/is-moderation-mode/true?v=v2&amp;amp;px=999" role="button" title="wildcard.png" alt="wildcard.png" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 06 Aug 2024 13:29:31 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/82041#M36493</guid>
      <dc:creator>ellerado</dc:creator>
      <dc:date>2024-08-06T13:29:31Z</dc:date>
    </item>
    <item>
      <title>Re: Create external table using multiple paths/locations</title>
      <link>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/104974#M41960</link>
      <description>&lt;P&gt;You do not have to create all the partition folders yourself.&lt;/P&gt;
&lt;P&gt;You just need to specify the parent folder like&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;SPAN class="k"&gt;CREATE&lt;/SPAN&gt; &lt;SPAN class="k"&gt;OR&lt;/SPAN&gt; &lt;SPAN class="k"&gt;REPLACE&lt;/SPAN&gt; &lt;SPAN class="k"&gt;TABLE&lt;/SPAN&gt; &lt;SPAN class="o"&gt;&amp;lt;&lt;/SPAN&gt;&lt;SPAN class="k"&gt;catalog&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;gt;&lt;/SPAN&gt;&lt;SPAN class="p"&gt;.&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;lt;&lt;/SPAN&gt;&lt;SPAN class="k"&gt;schema&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;gt;&lt;/SPAN&gt;&lt;SPAN class="p"&gt;.&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;lt;&lt;/SPAN&gt;&lt;SPAN class="k"&gt;table&lt;/SPAN&gt;&lt;SPAN class="o"&gt;-&lt;/SPAN&gt;&lt;SPAN class="n"&gt;name&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;gt;&lt;/SPAN&gt;
&lt;SPAN class="k"&gt;USING&lt;/SPAN&gt; &lt;SPAN class="o"&gt;&amp;lt;&lt;/SPAN&gt;&lt;SPAN class="n"&gt;format&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;gt;&lt;/SPAN&gt;
&lt;SPAN class="n"&gt;PARTITIONED&lt;/SPAN&gt; &lt;SPAN class="k"&gt;BY&lt;/SPAN&gt; &lt;SPAN class="p"&gt;(&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;lt;&lt;/SPAN&gt;&lt;SPAN class="n"&gt;partition&lt;/SPAN&gt;&lt;SPAN class="o"&gt;-&lt;/SPAN&gt;&lt;SPAN class="k"&gt;column&lt;/SPAN&gt;&lt;SPAN class="o"&gt;-&lt;/SPAN&gt;&lt;SPAN class="n"&gt;list&lt;/SPAN&gt;&lt;SPAN class="o"&gt;&amp;gt;&lt;/SPAN&gt;&lt;SPAN class="p"&gt;)&lt;/SPAN&gt;
&lt;SPAN class="k"&gt;LOCATION&lt;/SPAN&gt; &lt;SPAN class="s1"&gt;'s3://&amp;lt;bucket-path&amp;gt;/&amp;lt;table-directory&amp;gt;'&lt;/SPAN&gt;&lt;SPAN class="p"&gt;;&lt;/SPAN&gt;&lt;/PRE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Further reading:&amp;nbsp;&lt;A href="https://docs.databricks.com/en/tables/external-partition-discovery.html#manually-specify-paths-for-other-partition-types" target="_blank"&gt;https://docs.databricks.com/en/tables/external-partition-discovery.html#manually-specify-paths-for-other-partition-types&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jan 2025 15:19:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/create-external-table-using-multiple-paths-locations/m-p/104974#M41960</guid>
      <dc:creator>NandiniN</dc:creator>
      <dc:date>2025-01-09T15:19:23Z</dc:date>
    </item>
  </channel>
</rss>

