<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Z-order or Partitioning? Which is better for Data skipping? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/z-order-or-partitioning-which-is-better-for-data-skipping/m-p/21684#M14815</link>
    <description>&lt;P&gt;Partition pruning is the most efficient way to ensure data skipping. However, choosing the right column for partitioning is very important. Choosing the wrong column commonly leads to a large number of small files, and in such scenarios Z-order is the preferred option. &lt;/P&gt;</description>
    <pubDate>Tue, 22 Jun 2021 23:19:13 GMT</pubDate>
    <dc:creator>brickster_2018</dc:creator>
    <dc:date>2021-06-22T23:19:13Z</dc:date>
    <item>
      <title>Z-order or Partitioning? Which is better for Data skipping?</title>
      <link>https://community.databricks.com/t5/data-engineering/z-order-or-partitioning-which-is-better-for-data-skipping/m-p/21683#M14814</link>
      <description>&lt;P&gt;For Delta tables, between Z-order and Partitioning, which is the recommended technique for efficient Data Skipping?&lt;/P&gt;</description>
      <pubDate>Tue, 22 Jun 2021 23:16:50 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/z-order-or-partitioning-which-is-better-for-data-skipping/m-p/21683#M14814</guid>
      <dc:creator>brickster_2018</dc:creator>
      <dc:date>2021-06-22T23:16:50Z</dc:date>
    </item>
    <item>
      <title>Re: Z-order or Partitioning? Which is better for Data skipping?</title>
      <link>https://community.databricks.com/t5/data-engineering/z-order-or-partitioning-which-is-better-for-data-skipping/m-p/21684#M14815</link>
      <description>&lt;P&gt;Partition pruning is the most efficient way to ensure data skipping. However, choosing the right column for partitioning is very important. Choosing the wrong column commonly leads to a large number of small files, and in such scenarios Z-order is the preferred option. &lt;/P&gt;</description>
      <pubDate>Tue, 22 Jun 2021 23:19:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/z-order-or-partitioning-which-is-better-for-data-skipping/m-p/21684#M14815</guid>
      <dc:creator>brickster_2018</dc:creator>
      <dc:date>2021-06-22T23:19:13Z</dc:date>
    </item>
  </channel>
</rss>

