<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Loading multiple gz files from ADLS to Delta Lake/Delta table in ADB in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/loading-multiple-gz-files-from-adls-to-delta-lake-delta-table-in/m-p/5032#M1565</link>
    <description>&lt;P&gt;Hi, you can read GZ files through Spark.&lt;/P&gt;&lt;P&gt;&lt;A href="https://stackoverflow.com/questions/42761912/how-to-read-gz-compressed-file-by-pyspark" alt="https://stackoverflow.com/questions/42761912/how-to-read-gz-compressed-file-by-pyspark" target="_blank"&gt;https://stackoverflow.com/questions/42761912/how-to-read-gz-compressed-file-by-pyspark&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Please let us know if this helps. Also, please tag&amp;nbsp;&lt;A href="https://community.databricks.com/s/profile/0053f000000WWwvAAG" alt="https://community.databricks.com/s/profile/0053f000000WWwvAAG" target="_blank"&gt;@Debayan&lt;/A&gt;&amp;nbsp;with your next comment so that I will get notified. Thank you!&lt;/P&gt;</description>
    <pubDate>Tue, 09 May 2023 13:03:24 GMT</pubDate>
    <dc:creator>Debayan</dc:creator>
    <dc:date>2023-05-09T13:03:24Z</dc:date>
    <item>
      <title>Loading multiple gz files from ADLS to Delta Lake/Delta table in ADB</title>
      <link>https://community.databricks.com/t5/data-engineering/loading-multiple-gz-files-from-adls-to-delta-lake-delta-table-in/m-p/5031#M1564</link>
      <description>&lt;P&gt;I have several gz files (file.csv.gz) in an ADLS folder, each of which is quite large. All of these files were extracted from the same base table, so they contain similar data but for different dates. How can I load them into Delta Lake/a Delta table? We would like to do a quick POC on how much faster Databricks is at reading the data from these files in Delta, as other platform(s) couldn't scale well.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Any help would be much appreciated.&lt;/P&gt;&lt;P&gt;Krish.&lt;/P&gt;</description>
      <pubDate>Fri, 28 Apr 2023 22:21:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/loading-multiple-gz-files-from-adls-to-delta-lake-delta-table-in/m-p/5031#M1564</guid>
      <dc:creator>Krish1</dc:creator>
      <dc:date>2023-04-28T22:21:03Z</dc:date>
    </item>
    <item>
      <title>Re: Loading multiple gz files from ADLS to Delta Lake/Delta table in ADB</title>
      <link>https://community.databricks.com/t5/data-engineering/loading-multiple-gz-files-from-adls-to-delta-lake-delta-table-in/m-p/5032#M1565</link>
      <description>&lt;P&gt;Hi, you can read GZ files through Spark.&lt;/P&gt;&lt;P&gt;&lt;A href="https://stackoverflow.com/questions/42761912/how-to-read-gz-compressed-file-by-pyspark" alt="https://stackoverflow.com/questions/42761912/how-to-read-gz-compressed-file-by-pyspark" target="_blank"&gt;https://stackoverflow.com/questions/42761912/how-to-read-gz-compressed-file-by-pyspark&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Please let us know if this helps. Also, please tag&amp;nbsp;&lt;A href="https://community.databricks.com/s/profile/0053f000000WWwvAAG" alt="https://community.databricks.com/s/profile/0053f000000WWwvAAG" target="_blank"&gt;@Debayan&lt;/A&gt;&amp;nbsp;with your next comment so that I will get notified. Thank you!&lt;/P&gt;</description>
      <pubDate>Tue, 09 May 2023 13:03:24 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/loading-multiple-gz-files-from-adls-to-delta-lake-delta-table-in/m-p/5032#M1565</guid>
      <dc:creator>Debayan</dc:creator>
      <dc:date>2023-05-09T13:03:24Z</dc:date>
    </item>
  </channel>
</rss>

