<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Best ways to copy the parquet files in the staging directory to the Delta table in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/best-ways-to-copy-the-parquet-files-in-the-staging-directory-to/m-p/19298#M12920</link>
    <description>&lt;P&gt;I have some parquet data in a temporary directory. Can I copy it into the Delta table directly? What are the best options?&lt;/P&gt;</description>
    <pubDate>Fri, 25 Jun 2021 17:32:33 GMT</pubDate>
    <dc:creator>brickster_2018</dc:creator>
    <dc:date>2021-06-25T17:32:33Z</dc:date>
    <item>
      <title>Best ways to copy the parquet files in the staging directory to the Delta table</title>
      <link>https://community.databricks.com/t5/data-engineering/best-ways-to-copy-the-parquet-files-in-the-staging-directory-to/m-p/19298#M12920</link>
      <description>&lt;P&gt;I have some parquet data in a temporary directory. Can I copy it into the Delta table directly? What are the best options?&lt;/P&gt;</description>
      <pubDate>Fri, 25 Jun 2021 17:32:33 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/best-ways-to-copy-the-parquet-files-in-the-staging-directory-to/m-p/19298#M12920</guid>
      <dc:creator>brickster_2018</dc:creator>
      <dc:date>2021-06-25T17:32:33Z</dc:date>
    </item>
    <item>
      <title>Re: Best ways to copy the parquet files in the staging directory to the Delta table</title>
      <link>https://community.databricks.com/t5/data-engineering/best-ways-to-copy-the-parquet-files-in-the-staging-directory-to/m-p/19299#M12921</link>
      <description>&lt;P&gt;The easiest solution is to use the COPY INTO command. The COPY INTO command ensures idempotency, so even if the operation fails there are no data inconsistencies. The COPY INTO command utilizes the resources on the Spark cluster and hence completes faster.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/spark/latest/spark-sql/language-manual/delta-copy-into.html" target="_blank"&gt;https://docs.databricks.com/spark/latest/spark-sql/language-manual/delta-copy-into.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 25 Jun 2021 17:33:01 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/best-ways-to-copy-the-parquet-files-in-the-staging-directory-to/m-p/19299#M12921</guid>
      <dc:creator>brickster_2018</dc:creator>
      <dc:date>2021-06-25T17:33:01Z</dc:date>
    </item>
  </channel>
</rss>

