<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How to set up partitions on the streaming Delta Table? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33281#M24313</link>
    <description>&lt;P&gt;is the change data feed functionality (of your silver table) an option, combined with merge in your gold table?&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.microsoft.com/en-us/azure/databricks/delta/delta-change-data-feed" alt="https://docs.microsoft.com/en-us/azure/databricks/delta/delta-change-data-feed" target="_blank"&gt;https://docs.microsoft.com/en-us/azure/databricks/delta/delta-change-data-feed&lt;/A&gt;&lt;/P&gt;</description>
    <pubDate>Mon, 29 Aug 2022 08:39:25 GMT</pubDate>
    <dc:creator>-werners-</dc:creator>
    <dc:date>2022-08-29T08:39:25Z</dc:date>
    <item>
      <title>How to set up partitions on the streaming Delta Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33280#M24312</link>
      <description>&lt;P&gt;Let's assume that we have 3 streaming Delta Tables:&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Bronze&lt;/LI&gt;&lt;LI&gt;Silver&lt;/LI&gt;&lt;LI&gt;Gold&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;My aim is to add partitioning to Silver table (for example by Date). &lt;/P&gt;&lt;P&gt;So, as a result Gold table with throw an error that source table has been updated and I would need to set 'ignoreChanges' to 'true' option in the streaming. Then streaming will work but it will move all data from Silver (all files has been changed) to Gold resulting in duplicates.&lt;/P&gt;&lt;P&gt;My question is how to handle this problem in the best way? &lt;/P&gt;&lt;P&gt;Is it possible to manipulate streaming checkpoint somehow? &lt;/P&gt;</description>
      <pubDate>Mon, 29 Aug 2022 08:34:17 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33280#M24312</guid>
      <dc:creator>Leszek</dc:creator>
      <dc:date>2022-08-29T08:34:17Z</dc:date>
    </item>
    <item>
      <title>Re: How to set up partitions on the streaming Delta Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33281#M24313</link>
      <description>&lt;P&gt;is the change data feed functionality (of your silver table) an option, combined with merge in your gold table?&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.microsoft.com/en-us/azure/databricks/delta/delta-change-data-feed" alt="https://docs.microsoft.com/en-us/azure/databricks/delta/delta-change-data-feed" target="_blank"&gt;https://docs.microsoft.com/en-us/azure/databricks/delta/delta-change-data-feed&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 29 Aug 2022 08:39:25 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33281#M24313</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2022-08-29T08:39:25Z</dc:date>
    </item>
    <item>
      <title>Re: How to set up partitions on the streaming Delta Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33283#M24315</link>
      <description>&lt;P&gt;I never used CDC in Databricks but my ELT architecture is based on streaming and I don't want to change that. &lt;/P&gt;</description>
      <pubDate>Fri, 09 Sep 2022 13:50:00 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-set-up-partitions-on-the-streaming-delta-table/m-p/33283#M24315</guid>
      <dc:creator>Leszek</dc:creator>
      <dc:date>2022-09-09T13:50:00Z</dc:date>
    </item>
  </channel>
</rss>

