<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6776#M2793</link>
    <description>&lt;P&gt;I can see that setting ignoreChanges to true emits all the updates and also emits unchanged files from the same partition. According to the documentation, duplicates need to be handled downstream. Can you suggest how to handle the duplicate files?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This is from the Databricks documentation (https://docs.databricks.com/structured-streaming/delta-lake.html#ignore-updates-and-deletes):&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;"The semantics for ignoreChanges differ greatly from skipChangeCommits. With ignoreChanges enabled, rewritten data files in the source table are re-emitted after a data changing operation such as UPDATE, MERGE INTO, DELETE (within partitions), or OVERWRITE. Unchanged rows are often emitted alongside new rows, so downstream consumers must be able to handle duplicates. Deletes are not propagated downstream. ignoreChanges subsumes ignoreDeletes."&lt;/P&gt;</description>
    <pubDate>Fri, 31 Mar 2023 12:33:40 GMT</pubDate>
    <dc:creator>sanjay</dc:creator>
    <dc:date>2023-03-31T12:33:40Z</dc:date>
    <item>
      <title>error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6771#M2788</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have a pipeline running. I updated one file in a Delta table that had already been processed, and now I am getting this error:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update. This is currently not supported. If you'd like to ignore updates, set the option 'ignoreChanges' to 'true'.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I have set ignoreChanges to true, but I am still getting the same error.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;spark.readStream.format("delta")&lt;/P&gt;&lt;P&gt;  .option("ignoreChanges", "true")&lt;/P&gt;&lt;P&gt;  .load("/tmp/delta/user_events")&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Sanjay&lt;/P&gt;</description>
      <pubDate>Thu, 30 Mar 2023 12:02:21 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6771#M2788</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-03-30T12:02:21Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6772#M2789</link>
      <description>&lt;P&gt;@Sanjay Jain​&amp;nbsp;which runtime version are you using? The above should work if you have updated the required field, and the update should then be consumed by downstream consumers. Please check the article below:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt; &lt;A href="https://docs.databricks.com/structured-streaming/delta-lake.html#ignore-updates-and-deletes" target="_blank"&gt;https://docs.databricks.com/structured-streaming/delta-lake.html#ignore-updates-and-deletes&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 30 Mar 2023 12:16:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6772#M2789</guid>
      <dc:creator>karthik_p</dc:creator>
      <dc:date>2023-03-30T12:16:03Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6773#M2790</link>
      <description>&lt;P&gt;I am using 11.3 LTS. I have updated one field, and this data is consumed by the downstream consumer. The challenge is that the consumer also receives other, unchanged files along with the updated file.&lt;/P&gt;</description>
      <pubDate>Thu, 30 Mar 2023 12:20:06 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6773#M2790</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-03-30T12:20:06Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6774#M2791</link>
      <description>&lt;P&gt;@Sanjay Jain​&amp;nbsp;how did you update the file? Can you elaborate on the steps, please?&lt;/P&gt;</description>
      <pubDate>Thu, 30 Mar 2023 13:50:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6774#M2791</guid>
      <dc:creator>Sandeep</dc:creator>
      <dc:date>2023-03-30T13:50:03Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6775#M2792</link>
      <description>&lt;P&gt;Using merge into table a&lt;/P&gt;&lt;P&gt;using table b&lt;/P&gt;&lt;P&gt;when matched then update SET a.name= b.name&lt;/P&gt;</description>
      <pubDate>Thu, 30 Mar 2023 13:57:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6775#M2792</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-03-30T13:57:36Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6776#M2793</link>
      <description>&lt;P&gt;I can see that setting ignoreChanges to true emits all the updates and also emits unchanged files from the same partition. According to the documentation, duplicates need to be handled downstream. Can you suggest how to handle the duplicate files?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This is from the Databricks documentation (https://docs.databricks.com/structured-streaming/delta-lake.html#ignore-updates-and-deletes):&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;"The semantics for ignoreChanges differ greatly from skipChangeCommits. With ignoreChanges enabled, rewritten data files in the source table are re-emitted after a data changing operation such as UPDATE, MERGE INTO, DELETE (within partitions), or OVERWRITE. Unchanged rows are often emitted alongside new rows, so downstream consumers must be able to handle duplicates. Deletes are not propagated downstream. ignoreChanges subsumes ignoreDeletes."&lt;/P&gt;</description>
      <pubDate>Fri, 31 Mar 2023 12:33:40 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6776#M2793</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-03-31T12:33:40Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6777#M2794</link>
      <description>&lt;P&gt;Hi @Sanjay Jain​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope everything is going great.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Just wanted to check in if you were able to resolve your issue. If yes, would you be happy to mark an answer as best so that other members can find the solution more quickly? If not, please tell us so we can help you.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Cheers!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Sat, 01 Apr 2023 02:19:40 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6777#M2794</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2023-04-01T02:19:40Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperationException: Detected a data update</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6778#M2795</link>
      <description>&lt;P&gt;Hi Vidula,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Sorry, I am still looking for a solution. I would appreciate any help you can provide.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Sanjay&lt;/P&gt;</description>
      <pubDate>Mon, 03 Apr 2023 07:01:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/6778#M2795</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-04-03T07:01:22Z</dc:date>
    </item>
    <item>
      <title>Re: error after updating delta table  com.databricks.sql.transaction.tahoe.DeltaUnsupportedOperation</title>
      <link>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/56001#M30483</link>
      <description>&lt;P&gt;Hi Sanjay,&amp;nbsp;&lt;BR /&gt;You can try adding&amp;nbsp;&lt;SPAN class=""&gt;.&lt;/SPAN&gt;&lt;SPAN class=""&gt;option&lt;/SPAN&gt;&lt;SPAN class=""&gt;(&lt;/SPAN&gt;&lt;SPAN class=""&gt;"overwriteSchema"&lt;/SPAN&gt;&lt;SPAN class=""&gt;,&lt;/SPAN&gt; &lt;SPAN class=""&gt;"true"&lt;/SPAN&gt;&lt;SPAN class=""&gt;)&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 01 Jan 2024 20:10:24 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/error-after-updating-delta-table-com-databricks-sql-transaction/m-p/56001#M30483</guid>
      <dc:creator>Sanjeev_Chauhan</dc:creator>
      <dc:date>2024-01-01T20:10:24Z</dc:date>
    </item>
  </channel>
</rss>

