<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: What file statistics does Optimize return &amp; How can I use them to my advantage? in Machine Learning</title>
    <link>https://community.databricks.com/t5/machine-learning/what-file-statistics-does-optimize-return-how-can-i-use-them-to/m-p/21590#M1189</link>
    <description>&lt;P&gt;Optimize is largely designed as a data organization strategy for Delta Tables. It helps by compacting small files, collecting column stats to help with data skipping, and also Z-ordering the data if that's called explicitly, all of which can help with both read and write performance on Delta Tables. See this for additional details - &lt;A href="https://docs.databricks.com/delta/optimizations/file-mgmt.html" target="test_blank"&gt;https://docs.databricks.com/delta/optimizations/file-mgmt.html&lt;/A&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 23 Jun 2021 03:24:33 GMT</pubDate>
    <dc:creator>aladda</dc:creator>
    <dc:date>2021-06-23T03:24:33Z</dc:date>
    <item>
      <title>What file statistics does Optimize return &amp; How can I use them to my advantage?</title>
      <link>https://community.databricks.com/t5/machine-learning/what-file-statistics-does-optimize-return-how-can-i-use-them-to/m-p/21589#M1188</link>
      <description />
      <pubDate>Wed, 23 Jun 2021 02:07:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/what-file-statistics-does-optimize-return-how-can-i-use-them-to/m-p/21589#M1188</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2021-06-23T02:07:37Z</dc:date>
    </item>
    <item>
      <title>Re: What file statistics does Optimize return &amp; How can I use them to my advantage?</title>
      <link>https://community.databricks.com/t5/machine-learning/what-file-statistics-does-optimize-return-how-can-i-use-them-to/m-p/21590#M1189</link>
      <description>&lt;P&gt;Optimize is largely designed as a data organization strategy for Delta Tables. It helps by compacting small files, collecting column stats to help with data skipping, and also Z-ordering the data if that's called explicitly, all of which can help with both read and write performance on Delta Tables. See this for additional details - &lt;A href="https://docs.databricks.com/delta/optimizations/file-mgmt.html" target="test_blank"&gt;https://docs.databricks.com/delta/optimizations/file-mgmt.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 23 Jun 2021 03:24:33 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/what-file-statistics-does-optimize-return-how-can-i-use-them-to/m-p/21590#M1189</guid>
      <dc:creator>aladda</dc:creator>
      <dc:date>2021-06-23T03:24:33Z</dc:date>
    </item>
  </channel>
</rss>

