<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Delta Table on AWS Glue Catalog in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/delta-table-on-aws-glue-catalog/m-p/64338#M32546</link>
    <description>&lt;P&gt;&lt;SPAN&gt;Hi, could you please refer to something or explain in more detail your point about querying Delta Lake files directly instead of through the AWS Glue catalog and why it was highlighted as a best practice?&lt;/SPAN&gt;&lt;/P&gt;</description>
    <pubDate>Thu, 21 Mar 2024 20:43:22 GMT</pubDate>
    <dc:creator>monometa</dc:creator>
    <dc:date>2024-03-21T20:43:22Z</dc:date>
    <item>
      <title>Delta Table on AWS Glue Catalog</title>
      <link>https://community.databricks.com/t5/data-engineering/delta-table-on-aws-glue-catalog/m-p/52437#M29431</link>
      <description>&lt;P&gt;&lt;SPAN&gt;I have set up Databricks cluster to work with&amp;nbsp;&lt;/SPAN&gt;&lt;STRONG&gt;AWS Glue Catalog&lt;/STRONG&gt;&lt;SPAN&gt;&amp;nbsp;by enabling the&amp;nbsp;&lt;/SPAN&gt;&lt;STRONG&gt;&lt;I&gt;spark.databricks.hive.metastore.glueCatalog.enabled&lt;/I&gt;&lt;/STRONG&gt;&lt;SPAN&gt;&amp;nbsp;to&amp;nbsp;&lt;/SPAN&gt;&lt;STRONG&gt;&lt;I&gt;true&lt;/I&gt;&lt;/STRONG&gt;&lt;SPAN&gt;. However, when I create a&lt;/SPAN&gt;&lt;STRONG&gt;&amp;nbsp;Delta table&lt;/STRONG&gt;&lt;SPAN&gt;&amp;nbsp;on Glue Catalog, the schema reflected in the AWS Glue Catalog is incorrect. the table schema only has one column named `col` of type `array&amp;lt;string&amp;gt;`.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Tam_0-1700157256870.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/5123iE03C4C8FDF303EED/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Tam_0-1700157256870.png" alt="Tam_0-1700157256870.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Tam_1-1700157262740.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/5124i51F7BBFE0C2FF9B8/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Tam_1-1700157262740.png" alt="Tam_1-1700157262740.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Does anyone have any insights?&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 16 Nov 2023 17:56:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/delta-table-on-aws-glue-catalog/m-p/52437#M29431</guid>
      <dc:creator>Tam</dc:creator>
      <dc:date>2023-11-16T17:56:46Z</dc:date>
    </item>
    <item>
      <title>Re: Delta Table on AWS Glue Catalog</title>
      <link>https://community.databricks.com/t5/data-engineering/delta-table-on-aws-glue-catalog/m-p/64338#M32546</link>
      <description>&lt;P&gt;&lt;SPAN&gt;Hi, could you please refer to something or explain in more detail your point about querying Delta Lake files directly instead of through the AWS Glue catalog and why it was highlighted as a best practice?&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 21 Mar 2024 20:43:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/delta-table-on-aws-glue-catalog/m-p/64338#M32546</guid>
      <dc:creator>monometa</dc:creator>
      <dc:date>2024-03-21T20:43:22Z</dc:date>
    </item>
  </channel>
</rss>

