<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Copying Delta table from QA to Prod in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10970#M6012</link>
    <description>&lt;P&gt;Does it support cloning across the subscription ? If so can you share an example?&lt;/P&gt;</description>
    <pubDate>Mon, 23 Jan 2023 03:41:48 GMT</pubDate>
    <dc:creator>MachuPichu</dc:creator>
    <dc:date>2023-01-23T03:41:48Z</dc:date>
    <item>
      <title>Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10967#M6009</link>
      <description>&lt;P&gt;I am looking for a way to copy a large managed Delta table (about 4TB) from one environment (QA) to another (Prod). QA and Prod are in different subscriptions and in different regions. I understand Databricks provides a way to clone a table, but I am not sure if cloning can work across subscriptions. Yes, there is network connectivity between QA and Prod in case files need to be copied from the lower to the higher environment. I am sure I am not the first person trying to copy tables across environments. Can you share how you performed such a copy/migration?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Sat, 21 Jan 2023 19:36:11 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10967#M6009</guid>
      <dc:creator>MachuPichu</dc:creator>
      <dc:date>2023-01-21T19:36:11Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10968#M6010</link>
      <description>&lt;P&gt;USE DEEP CLONE &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;CREATE&lt;/B&gt; &lt;B&gt;TABLE&lt;/B&gt; delta.`/&lt;B&gt;data&lt;/B&gt;/target/` CLONE delta.`/&lt;B&gt;data&lt;/B&gt;/&lt;B&gt;source&lt;/B&gt;/` -- Create a deep clone of /data/source at /data/target&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;ref link: &lt;A href="https://docs.databricks.com/optimizations/clone.html" target="_blank"&gt;https://docs.databricks.com/optimizations/clone.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 22 Jan 2023 12:37:09 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10968#M6010</guid>
      <dc:creator>sher</dc:creator>
      <dc:date>2023-01-22T12:37:09Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10969#M6011</link>
      <description>&lt;P&gt;I don't know if it would be an ideal option, but please read more about Unity Catalog and Delta Sharing. DEEP CLONE sounds good.&lt;/P&gt;</description>
      <pubDate>Sun, 22 Jan 2023 15:52:04 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10969#M6011</guid>
      <dc:creator>Cami</dc:creator>
      <dc:date>2023-01-22T15:52:04Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10970#M6012</link>
      <description>&lt;P&gt;Does it support cloning across the subscription ? If so can you share an example?&lt;/P&gt;</description>
      <pubDate>Mon, 23 Jan 2023 03:41:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10970#M6012</guid>
      <dc:creator>MachuPichu</dc:creator>
      <dc:date>2023-01-23T03:41:48Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10971#M6013</link>
      <description>&lt;P&gt;We are not using unity catalog. This is still based on Hive catalog&lt;/P&gt;</description>
      <pubDate>Mon, 23 Jan 2023 03:43:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10971#M6013</guid>
      <dc:creator>MachuPichu</dc:creator>
      <dc:date>2023-01-23T03:43:03Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10972#M6014</link>
      <description>&lt;P&gt;@Ratnadeep Bose&amp;nbsp;&lt;/P&gt;&lt;P&gt;The best way would be to create a storage location that will be used to copy the data between the two environments.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Create an external table on Sub1 with the same schema as the source table, with its location on the storage,&lt;/LI&gt;&lt;LI&gt;Insert into the external table from the source table,&lt;/LI&gt;&lt;LI&gt;Create an external table on Sub2 with the same schema as the source table, with its location on the storage.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks to that, you've got the same data on both subscriptions.&lt;/P&gt;</description>
      <pubDate>Mon, 23 Jan 2023 09:34:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10972#M6014</guid>
      <dc:creator>daniel_sahal</dc:creator>
      <dc:date>2023-01-23T09:34:34Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10973#M6015</link>
      <description>&lt;P&gt;I would use a data factory to copy 4TB files as it has gigantic throughput. After completing a copy of everything, I would register as a table in the new metastore.&lt;/P&gt;</description>
      <pubDate>Mon, 23 Jan 2023 13:24:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10973#M6015</guid>
      <dc:creator>Hubert-Dudek</dc:creator>
      <dc:date>2023-01-23T13:24:41Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10974#M6016</link>
      <description>&lt;P&gt;Just to be clear, we are using a managed Delta table, not an external table. I am not sure if the above solution will still work. Thanks very much for your feedback.&lt;/P&gt;</description>
      <pubDate>Tue, 24 Jan 2023 20:29:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10974#M6016</guid>
      <dc:creator>MachuPichu</dc:creator>
      <dc:date>2023-01-24T20:29:26Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10975#M6017</link>
      <description>&lt;P&gt;Thought about using ADF. Since we are using a managed Delta table, I am not sure how you can register a table based on external data. Any idea?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 24 Jan 2023 20:33:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10975#M6017</guid>
      <dc:creator>MachuPichu</dc:creator>
      <dc:date>2023-01-24T20:33:41Z</dc:date>
    </item>
    <item>
      <title>Re: Copying Delta table from QA to Prod</title>
      <link>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10976#M6018</link>
      <description>&lt;P&gt;@Ratnadeep Bose&amp;nbsp;&lt;/P&gt;&lt;P&gt;That's why I mentioned creating an external table as the table that will be used to copy data between the two environments. It should be a copy of the source table, but with its location on the storage.&lt;/P&gt;</description>
      <pubDate>Wed, 25 Jan 2023 06:32:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/copying-delta-table-from-qa-to-prod/m-p/10976#M6018</guid>
      <dc:creator>daniel_sahal</dc:creator>
      <dc:date>2023-01-25T06:32:18Z</dc:date>
    </item>
  </channel>
</rss>

