<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Number of parquet files per delta table in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/number-of-parquet-files-per-delta-table/m-p/25509#M17749</link>
    <description>&lt;P&gt;Hello. We would like to understand how many parquet files are created per data table. To be more specific, we refer to the current snapshot of the table. For example, we noticed that when we performed the initial inserts into a table, one parquet file was created for each row. However, when we added a column and performed a bulk update, one parquet file was created for every two rows. Is there any pattern to this? Thank you in advance.&lt;/P&gt;</description>
    <pubDate>Thu, 27 Oct 2022 12:21:06 GMT</pubDate>
    <dc:creator>elgeo</dc:creator>
    <dc:date>2022-10-27T12:21:06Z</dc:date>
    <item>
      <title>Number of parquet files per delta table</title>
      <link>https://community.databricks.com/t5/data-engineering/number-of-parquet-files-per-delta-table/m-p/25509#M17749</link>
      <description>&lt;P&gt;Hello. We would like to understand how many parquet files are created per data table. To be more specific, we refer to the current snapshot of the table. For example, we noticed that when we performed the initial inserts into a table, one parquet file was created for each row. However, when we added a column and performed a bulk update, one parquet file was created for every two rows. Is there any pattern to this? Thank you in advance.&lt;/P&gt;</description>
      <pubDate>Thu, 27 Oct 2022 12:21:06 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/number-of-parquet-files-per-delta-table/m-p/25509#M17749</guid>
      <dc:creator>elgeo</dc:creator>
      <dc:date>2022-10-27T12:21:06Z</dc:date>
    </item>
  </channel>
</rss>

