<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How to load xlsx Files to Delta Live Tables (DLT)? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74083#M34719</link>
    <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/102842"&gt;@avrm91&lt;/a&gt;&amp;nbsp; - you can try dividing the xlsx files into csv files as a preprocessing step and ingesting them into a dataframe using Autoloader. Also, you can use openpyxl to load them into a dataframe. Refer to this &lt;A href="https://kb.databricks.com/libraries/xlsx-file-not-supported-xlrd?from_search=149888754" target="_self"&gt;doc&lt;/A&gt; for an example.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Fri, 14 Jun 2024 20:44:41 GMT</pubDate>
    <dc:creator>shan_chandra</dc:creator>
    <dc:date>2024-06-14T20:44:41Z</dc:date>
    <item>
      <title>How to load xlsx Files to Delta Live Tables (DLT)?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/73793#M34665</link>
      <description>&lt;P&gt;I want to load a .xlsx file to DLT but am struggling, as this format is not supported by Autoloader.&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;With the Assistant, I tried to load the .xlsx into a data frame first and then pass it to DLT.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;import dlt
from pyspark.sql import SparkSession

# Load xlsx file into DataFrame
df = spark.read \
    .format("com.crealytics.spark.excel") \
    .option("dataAddress", "${my_etl.sheet_address}") \
    .option("header", "${my_etl.header}") \
    .option("inferSchema", "${my_etl.infer_schema}") \
    .option("timestampFormat", "${my_etl.timestamp_format}") \
    .load("${my_etl.input_path}")

@dlt.table
def conformed():
    return df&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;but it is not working.&lt;/P&gt;</description>
      <pubDate>Thu, 13 Jun 2024 13:54:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/73793#M34665</guid>
      <dc:creator>avrm91</dc:creator>
      <dc:date>2024-06-13T13:54:41Z</dc:date>
    </item>
    <item>
      <title>Re: How to load xlsx Files to Delta Live Tables (DLT)?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74083#M34719</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/102842"&gt;@avrm91&lt;/a&gt;&amp;nbsp; - you can try dividing the xlsx files into csv files as a preprocessing step and ingesting them into a dataframe using Autoloader. Also, you can use openpyxl to load them into a dataframe. Refer to this &lt;A href="https://kb.databricks.com/libraries/xlsx-file-not-supported-xlrd?from_search=149888754" target="_self"&gt;doc&lt;/A&gt; for an example.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 14 Jun 2024 20:44:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74083#M34719</guid>
      <dc:creator>shan_chandra</dc:creator>
      <dc:date>2024-06-14T20:44:41Z</dc:date>
    </item>
    <item>
      <title>Re: How to load xlsx Files to Delta Live Tables (DLT)?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74854#M34799</link>
      <description>&lt;P&gt;For now, I will use Azure Data Factory to convert the xlsx to csv and then process it within Databricks.&amp;nbsp;&lt;BR /&gt;Overall, I wonder if there will be an xlsx Autoloader implementation in the future, as the preprocessing will not have the Autoloader features and I will need to keep track of what was already loaded and what was not.&lt;BR /&gt;All in all, I would not say that it is a solution, so I will leave this ticket open.&lt;/P&gt;</description>
      <pubDate>Tue, 18 Jun 2024 12:07:51 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74854#M34799</guid>
      <dc:creator>avrm91</dc:creator>
      <dc:date>2024-06-18T12:07:51Z</dc:date>
    </item>
    <item>
      <title>Re: How to load xlsx Files to Delta Live Tables (DLT)?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74888#M34808</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/102842"&gt;@avrm91&lt;/a&gt;&amp;nbsp;- There is a feature request in place. DB engineering will prioritize it. As of now, there is no ETA on this.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 18 Jun 2024 15:56:08 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/74888#M34808</guid>
      <dc:creator>shan_chandra</dc:creator>
      <dc:date>2024-06-18T15:56:08Z</dc:date>
    </item>
    <item>
      <title>Re: How to load xlsx Files to Delta Live Tables (DLT)?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/76477#M35225</link>
      <description>&lt;P&gt;Added a feature request into Azure Community Portal&lt;BR /&gt;&lt;A href="https://feedback.azure.com/d365community/idea/cfdf2172-5038-ef11-a296-000d3ae4120b" target="_blank"&gt;XLSX - DLT Autoloader · Community (azure.com)&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 02 Jul 2024 08:57:31 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-load-xlsx-files-to-delta-live-tables-dlt/m-p/76477#M35225</guid>
      <dc:creator>avrm91</dc:creator>
      <dc:date>2024-07-02T08:57:31Z</dc:date>
    </item>
  </channel>
</rss>

