<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic How to calculate the individual file count, file size and number of rows on a Delta table? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-calculate-the-individual-file-count-file-size-and-number/m-p/83842#M37030</link>
    <description>&lt;P&gt;There are instances where we need to know the individual file sizes or the file count of a Delta table rather than the average file size. We can use the query below to determine that.&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;%sql
select count(*) as rows, file_path, file_size from (select * , _metadata.file_path, _metadata.file_size from  &amp;lt;table_name or delta.`file_path`&amp;gt;) group by file_path, file_size&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Wed, 21 Aug 2024 19:18:12 GMT</pubDate>
    <dc:creator>shan_chandra</dc:creator>
    <dc:date>2024-08-21T19:18:12Z</dc:date>
    <item>
      <title>How to calculate the individual file count, file size and number of rows on a Delta table?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-calculate-the-individual-file-count-file-size-and-number/m-p/83842#M37030</link>
      <description>&lt;P&gt;There are instances where we need to know the individual file sizes or the file count of a Delta table rather than the average file size. We can use the query below to determine that.&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;%sql
select count(*) as rows, file_path, file_size from (select * , _metadata.file_path, _metadata.file_size from  &amp;lt;table_name or delta.`file_path`&amp;gt;) group by file_path, file_size&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 21 Aug 2024 19:18:12 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-calculate-the-individual-file-count-file-size-and-number/m-p/83842#M37030</guid>
      <dc:creator>shan_chandra</dc:creator>
      <dc:date>2024-08-21T19:18:12Z</dc:date>
    </item>
  </channel>
</rss>

