<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Comparison between parquet format  and avro format in Warehousing &amp; Analytics</title>
    <link>https://community.databricks.com/t5/warehousing-analytics/comparison-between-parquet-format-and-avro-format/m-p/19653#M377</link>
    <description />
    <pubDate>Fri, 25 Jun 2021 15:44:37 GMT</pubDate>
    <dc:creator>User16826994223</dc:creator>
    <dc:date>2021-06-25T15:44:37Z</dc:date>
    <item>
      <title>Comparison between parquet format  and avro format</title>
      <link>https://community.databricks.com/t5/warehousing-analytics/comparison-between-parquet-format-and-avro-format/m-p/19653#M377</link>
      <description />
      <pubDate>Fri, 25 Jun 2021 15:44:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/warehousing-analytics/comparison-between-parquet-format-and-avro-format/m-p/19653#M377</guid>
      <dc:creator>User16826994223</dc:creator>
      <dc:date>2021-06-25T15:44:37Z</dc:date>
    </item>
    <item>
      <title>Re: Comparison between parquet format  and avro format</title>
      <link>https://community.databricks.com/t5/warehousing-analytics/comparison-between-parquet-format-and-avro-format/m-p/19654#M378</link>
      <description>&lt;OL&gt;&lt;LI&gt;AVRO is a row-based storage format, whereas PARQUET is a column-based storage format.&lt;/LI&gt;&lt;LI&gt;PARQUET is much better for analytical querying, i.e. reads and queries are much more efficient than writes.&lt;/LI&gt;&lt;LI&gt;Write operations in AVRO are better than in PARQUET.&lt;/LI&gt;&lt;LI&gt;AVRO is much more mature than PARQUET when it comes to schema evolution. PARQUET only supports schema append, whereas AVRO supports more full-featured schema evolution, i.e. adding or modifying columns.&lt;/LI&gt;&lt;LI&gt;PARQUET is ideal for querying a subset of columns in a multi-column table. AVRO is ideal for ETL operations where we need to query all the columns.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 25 Jun 2021 15:44:50 GMT</pubDate>
      <guid>https://community.databricks.com/t5/warehousing-analytics/comparison-between-parquet-format-and-avro-format/m-p/19654#M378</guid>
      <dc:creator>User16826994223</dc:creator>
      <dc:date>2021-06-25T15:44:50Z</dc:date>
    </item>
  </channel>
</rss>

