<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Performance issues when loading an Excel file from DBFS using R in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5635#M2002</link>
    <description>&lt;P&gt;Hi @Marcel Baumgartner​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thank you for posting your question in our community! We are happy to assist you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;To help us provide you with the most accurate information, could you please take a moment to review the responses and select the one that best answers your question?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This will also help other community members who may have similar questions in the future. Thank you for your participation and let us know if you need any further assistance!&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
    <pubDate>Mon, 24 Apr 2023 04:29:01 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2023-04-24T04:29:01Z</dc:date>
    <item>
      <title>Performance issues when loading an Excel file from DBFS using R</title>
      <link>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5632#M1999</link>
      <description>&lt;P&gt;I have uploaded small Excel files on my DBFS. I then use function read_xlsx() from the "readxl" package in R to import the file into the R memory. I use a standard cluster (12.1, non ML). The function works but it takes ages. E.g. a simple Excel table with 40000+ records and 5 columns takes 9 minutes. On my R installation on Windows, the load is instantaneous. "readxl" is considered to be the best package to deal with Excel files. It is part of the already made available libraries on the cluster. Any idea what might cause this?&lt;/P&gt;</description>
      <pubDate>Tue, 18 Apr 2023 10:34:20 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5632#M1999</guid>
      <dc:creator>mbaumga</dc:creator>
      <dc:date>2023-04-18T10:34:20Z</dc:date>
    </item>
    <item>
      <title>Re: Performance issues when loading an Excel file from DBFS using R</title>
      <link>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5634#M2001</link>
      <description>&lt;P&gt;Dear Kaniz, thanks. Your suggestion to copy the Excel file from DBFS to a temp folder "e.g. /tmp/" worked. Once I run read_xlsx() the upload is instantaneous.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Indeed, we had the same problem the other way around. I was not able to save an xlsx or pdf file into a folder on "/dbfs/FileStore/*". However, I can save it to "/tmp/*" and then copy it to where I want the file to be. Good to know!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks again!&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2023 05:50:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5634#M2001</guid>
      <dc:creator>mbaumga</dc:creator>
      <dc:date>2023-04-20T05:50:07Z</dc:date>
    </item>
    <item>
      <title>Re: Performance issues when loading an Excel file from DBFS using R</title>
      <link>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5635#M2002</link>
      <description>&lt;P&gt;Hi @Marcel Baumgartner​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thank you for posting your question in our community! We are happy to assist you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;To help us provide you with the most accurate information, could you please take a moment to review the responses and select the one that best answers your question?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This will also help other community members who may have similar questions in the future. Thank you for your participation and let us know if you need any further assistance!&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 24 Apr 2023 04:29:01 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5635#M2002</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2023-04-24T04:29:01Z</dc:date>
    </item>
    <item>
      <title>Re: Performance issues when loading an Excel file from DBFS using R</title>
      <link>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5636#M2003</link>
      <description>&lt;P&gt;The question was answered successfully. All okay!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 28 Apr 2023 10:55:50 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/performance-issues-when-loading-an-excel-file-from-dbfs-using-r/m-p/5636#M2003</guid>
      <dc:creator>mbaumga</dc:creator>
      <dc:date>2023-04-28T10:55:50Z</dc:date>
    </item>
  </channel>
</rss>

