<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Dealing with updates to a delta  table being used as a streaming source in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31921#M23273</link>
    <description>&lt;P&gt;Hi @Leszek​&amp;nbsp;&lt;/P&gt;&lt;P&gt;For your case, the &lt;B&gt;ignoreChanges option will work, but you need to handle duplicates from your streaming app while writing to the sink. If your sink is Delta, then you can go with Delta Streaming Merge.&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/_static/notebooks/merge-in-streaming.html" target="test_blank"&gt;https://docs.databricks.com/_static/notebooks/merge-in-streaming.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
    <pubDate>Sun, 13 Mar 2022 08:11:38 GMT</pubDate>
    <dc:creator>Manjunath</dc:creator>
    <dc:date>2022-03-13T08:11:38Z</dc:date>
    <item>
      <title>Dealing with updates to a delta  table being used as a streaming source</title>
      <link>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31917#M23269</link>
      <description>&lt;P&gt;Hi All&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have a requirement to perform updates on a delta table that is the source for a streaming query.&lt;/P&gt;&lt;P&gt;I would like to be able to update the table and have the stream continue to work while also not ending up with duplicates.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;From my research, it seems that the ignoreDeletes option will not work, as I am not going to be updating/deleting based on the partition column. The ignoreChanges option also looks unsuitable, as it will generate duplicates not only of the rows I update but also of any other rows in the same files.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Does anyone have any suggestions/procedures they've used for similar situations in the past?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Tue, 11 Jan 2022 09:31:42 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31917#M23269</guid>
      <dc:creator>Confused</dc:creator>
      <dc:date>2022-01-11T09:31:42Z</dc:date>
    </item>
    <item>
      <title>Re: Dealing with updates to a delta  table being used as a streaming source</title>
      <link>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31920#M23272</link>
      <description>&lt;P&gt;Maybe merging data from the updated delta table into the next streaming delta table will work?&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.youtube.com/watch?v=2Iy5S0Hf4XM" target="test_blank"&gt;https://www.youtube.com/watch?v=2Iy5S0Hf4XM&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 26 Jan 2022 11:21:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31920#M23272</guid>
      <dc:creator>Leszek</dc:creator>
      <dc:date>2022-01-26T11:21:16Z</dc:date>
    </item>
    <item>
      <title>Re: Dealing with updates to a delta  table being used as a streaming source</title>
      <link>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31921#M23273</link>
      <description>&lt;P&gt;Hi @Leszek​&amp;nbsp;&lt;/P&gt;&lt;P&gt;For your case, the &lt;B&gt;ignoreChanges option will work, but you need to handle duplicates from your streaming app while writing to the sink. If your sink is Delta, then you can go with Delta Streaming Merge.&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/_static/notebooks/merge-in-streaming.html" target="test_blank"&gt;https://docs.databricks.com/_static/notebooks/merge-in-streaming.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 13 Mar 2022 08:11:38 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31921#M23273</guid>
      <dc:creator>Manjunath</dc:creator>
      <dc:date>2022-03-13T08:11:38Z</dc:date>
    </item>
    <item>
      <title>Re: Dealing with updates to a delta  table being used as a streaming source</title>
      <link>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31922#M23274</link>
      <description>&lt;P&gt;Hey @Mathew Walters​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope you are doing great.&lt;/P&gt;&lt;P&gt;Just wanted to check in: were you able to resolve your issue, and if so, would you be happy to share the solution? Otherwise, please let us know if you need more help.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2022 15:36:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/dealing-with-updates-to-a-delta-table-being-used-as-a-streaming/m-p/31922#M23274</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-05-19T15:36:37Z</dc:date>
    </item>
  </channel>
</rss>

