<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Log has failed integrity check error when altering a table property in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18463#M12253</link>
    <description>&lt;P&gt;&lt;/P&gt;&lt;P&gt;Below is the integrity check error we are getting when trying to set the deletedFileRetentionDuration table property to 10 days.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image.png"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1031i3FB0CDB63B1B12C8/image-size/large?v=v2&amp;amp;px=999" role="button" title="image.png" alt="image.png" /&gt;&lt;/span&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1029i992B86C30DE0F582/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Observation: The table data is sitting in S3. The size of all the files in S3 is in TB. There are millions of files for this table.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;What is the best way to clear out the error apart from dropping and recreating the table?&lt;/P&gt;</description>
    <pubDate>Mon, 05 Dec 2022 21:56:55 GMT</pubDate>
    <dc:creator>LavaLiah_85929</dc:creator>
    <dc:date>2022-12-05T21:56:55Z</dc:date>
    <item>
      <title>Log has failed integrity check error when altering a table property</title>
      <link>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18463#M12253</link>
      <description>&lt;P&gt;&lt;/P&gt;&lt;P&gt;Below is the integrity check error we are getting when trying to set the deletedFileRetentionDuration table property to 10 days.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image.png"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1031i3FB0CDB63B1B12C8/image-size/large?v=v2&amp;amp;px=999" role="button" title="image.png" alt="image.png" /&gt;&lt;/span&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1029i992B86C30DE0F582/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Observation: The table data is sitting in S3. The size of all the files in S3 is in TB. There are millions of files for this table.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;What is the best way to clear out the error apart from dropping and recreating the table?&lt;/P&gt;</description>
      <pubDate>Mon, 05 Dec 2022 21:56:55 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18463#M12253</guid>
      <dc:creator>LavaLiah_85929</dc:creator>
      <dc:date>2022-12-05T21:56:55Z</dc:date>
    </item>
    <item>
      <title>Re: Log has failed integrity check error when altering a table property</title>
      <link>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18464#M12254</link>
      <description>&lt;P&gt;This might be because of issues in the transaction logs. Since this is an external table in Delta format, CREATE OR REPLACE TABLE should fix the transaction log issue.&lt;/P&gt;&lt;P&gt;However, if the issue still persists, you can contact Databricks support or set this config to skip the issue.&lt;/P&gt;&lt;P&gt;spark.conf.set("spark.databricks.delta.state.corruptionIsFatal", False)&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope this helps.&lt;/P&gt;&lt;P&gt;Cheers.&lt;/P&gt;</description>
      <pubDate>Tue, 06 Dec 2022 08:11:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18464#M12254</guid>
      <dc:creator>UmaMahesh1</dc:creator>
      <dc:date>2022-12-06T08:11:36Z</dc:date>
    </item>
    <item>
      <title>Re: Log has failed integrity check error when altering a table property</title>
      <link>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18465#M12255</link>
      <description>&lt;P&gt;Please back up your table, then run a repair of the files:&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;FSCK REPAIR TABLE table_name&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;You can also try a dry run first:&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;FSCK REPAIR TABLE table_name DRY RUN&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;If the data is partitioned, it can be helpful to refresh the metastore:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;MSCK REPAIR TABLE mytable&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 06 Dec 2022 11:20:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/log-has-failed-integrity-check-error-when-altering-a-table/m-p/18465#M12255</guid>
      <dc:creator>Hubert-Dudek</dc:creator>
      <dc:date>2022-12-06T11:20:13Z</dc:date>
    </item>
  </channel>
</rss>

