<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Users are failing query data from S3 bucket in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23509#M16234</link>
    <description>&lt;P&gt;Hi @karthik p​&amp;nbsp;&lt;/P&gt;&lt;P&gt;Yes, all relevant S3 bucket permission for this user is set&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
    <pubDate>Wed, 09 Nov 2022 09:40:17 GMT</pubDate>
    <dc:creator>164079</dc:creator>
    <dc:date>2022-11-09T09:40:17Z</dc:date>
    <item>
      <title>Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23500#M16225</link>
      <description>&lt;P&gt;Hi team, &lt;/P&gt;&lt;P&gt;Users are unable to run SELECT on data located in S3 buckets, although the S3 permissions are OK.&lt;/P&gt;&lt;P&gt;The only way they manage to do it is by being granted the Databricks workspace admin permission.&lt;/P&gt;&lt;P&gt;The error is attached.&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
      <pubDate>Sun, 06 Nov 2022 11:50:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23500#M16225</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-06T11:50:34Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23501#M16226</link>
      <description>&lt;P&gt;Hi @Avi Edri​&amp;nbsp;,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;it looks like your users are missing SELECT ANY FILE permission (which admins are granted by default), please see here for more details:&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/security/access-control/table-acls/object-privileges.html" target="test_blank"&gt;https://docs.databricks.com/security/access-control/table-acls/object-privileges.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1235iC498D6DD3386B9ED/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I assume you are not using Unity Catalog. It's not easy to achieve both without Unity Catalog - access data through Tables and through file path (spark.read... ). &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;You might need to re-visit data access on your side. I do believe when you have Table Access Control enabled cluster then you are limited to use tables - select * from some_table, unless you have permission to SELECT ANY FILE, then you can bypass this restriction.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Unity Catalog is way forward, it enables more security and allows some flexibility here.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;thanks,&lt;/P&gt;&lt;P&gt;Patryk.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 07 Nov 2022 12:41:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23501#M16226</guid>
      <dc:creator>Pat</dc:creator>
      <dc:date>2022-11-07T12:41:07Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23502#M16227</link>
      <description>&lt;P&gt;Thank you Pat, &lt;/P&gt;&lt;P&gt;Can you please guide me on how to grant the ANY FILE permission to my users or groups?&lt;/P&gt;&lt;P&gt;Also, is there a way to grant SELECT on all databases via a mysql command or the terminal?&lt;/P&gt;&lt;P&gt;We are not using Unity Catalog, and our table permission policy is enabled.&lt;/P&gt;&lt;P&gt;Avi&lt;/P&gt;</description>
      <pubDate>Tue, 08 Nov 2022 16:25:00 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23502#M16227</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-08T16:25:00Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23503#M16228</link>
      <description>&lt;P&gt;This will work with sql (notebook):&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;GRANT SELECT ON ANY FILE TO `group-name`&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;or maybe this with terraform:&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;resource "databricks_sql_permissions" "any_file" {
  any_file = true
&amp;nbsp;
&amp;nbsp;
  privilege_assignments {
    principal  = "group-name"
    privileges = ["SELECT"]
  }
&amp;nbsp;
}&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;I didn't try the terraform one.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://registry.terraform.io/providers/databricks/databricks/latest/docs/resources/sql_permissions#any_file" target="test_blank"&gt;https://registry.terraform.io/providers/databricks/databricks/latest/docs/resources/sql_permissions#any_file&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;thanks,&lt;/P&gt;&lt;P&gt;Pat.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 08 Nov 2022 16:32:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23503#M16228</guid>
      <dc:creator>Pat</dc:creator>
      <dc:date>2022-11-08T16:32:03Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23504#M16229</link>
      <description>&lt;P&gt;Thank you Pat, &lt;/P&gt;&lt;P&gt;When running this query I'm getting the exception below:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Error in SQL statement: SparkException: Trying to perform permission action on Hive Metastore /ANY_FILE but Table Access Control is not enabled on this cluster. &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I verified that Table Access Control is enabled in my workspace settings.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1238i25452D76FC34ED3B/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 08 Nov 2022 17:53:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23504#M16229</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-08T17:53:23Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23505#M16230</link>
      <description>&lt;P&gt;You need to use cluster with TAC enabled.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/security/access-control/table-acls/table-acl.html" alt="https://docs.databricks.com/security/access-control/table-acls/table-acl.html" target="_blank"&gt;https://docs.databricks.com/security/access-control/table-acls/table-acl.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;there were some changes to the UI recently, you can follow instructions here.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/clusters/cluster-ui-preview.html" alt="https://docs.databricks.com/clusters/cluster-ui-preview.html" target="_blank"&gt;https://docs.databricks.com/clusters/cluster-ui-preview.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;thanks,&lt;/P&gt;&lt;P&gt;Pat.&lt;/P&gt;</description>
      <pubDate>Tue, 08 Nov 2022 19:35:45 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23505#M16230</guid>
      <dc:creator>Pat</dc:creator>
      <dc:date>2022-11-08T19:35:45Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23506#M16231</link>
      <description>&lt;P&gt;@Avi Edri​&amp;nbsp;adding some more info to @Pat Sienkiewicz​&amp;nbsp;suggestion, @Avi Edri​&amp;nbsp;are you using cluster with instance profile, if you are using instance profile configured, please validate read permissions are there on that bucket and instance profile assigned cluster is enabled for user  &lt;/P&gt;</description>
      <pubDate>Tue, 08 Nov 2022 21:34:15 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23506#M16231</guid>
      <dc:creator>karthik_p</dc:creator>
      <dc:date>2022-11-08T21:34:15Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23508#M16233</link>
      <description>&lt;P&gt;Hi @Pat, &lt;/P&gt;&lt;P&gt;I'm getting this error after adding this config to my global init script:&lt;/P&gt;&lt;P&gt;spark.databricks.acl.sqlOnly true&lt;/P&gt;&lt;P&gt;This is the error:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1242iD69C9DC283E7EBD9/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;Thank you!&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 07:39:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23508#M16233</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-09T07:39:26Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23509#M16234</link>
      <description>&lt;P&gt;Hi @karthik p​&amp;nbsp;&lt;/P&gt;&lt;P&gt;Yes, all relevant S3 bucket permission for this user is set&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 09:40:17 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23509#M16234</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-09T09:40:17Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23510#M16235</link>
      <description>&lt;P&gt;Thanks ! @Kaniz Fatma​&amp;nbsp;&lt;/P&gt;&lt;P&gt;Will update as soon as my issue resolved.&lt;/P&gt;&lt;P&gt;Avi&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 09:41:14 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23510#M16235</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-09T09:41:14Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23511#M16236</link>
      <description>&lt;P&gt;Hmm,&lt;/P&gt;&lt;P&gt;let's try something like this.&lt;/P&gt;&lt;P&gt;When you create a new cluster you can click on the `UI Preview` and `Legacy UI is enabled`&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1250i5A1FF53F8CEED901/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;choose Cluster mode: &lt;B&gt;High Concurrency&lt;/B&gt;&lt;/P&gt;&lt;P&gt;in Advanced Options:&lt;/P&gt;&lt;P&gt;Table Access Control - Enable:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1240iA75EE44E42A9B2D5/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;on the right side you can switch to JSON and see what I have:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;{
    "autoscale": {
        "min_workers": 2,
        "max_workers": 8
    },
    "cluster_name": "Pat's Cluster",
    "spark_version": "10.4.x-scala2.12",
    "spark_conf": {
        "spark.databricks.cluster.profile": "serverless",
        "spark.databricks.repl.allowedLanguages": "python,sql",
        "spark.databricks.acl.dfAclsEnabled": "true"
    },
    "aws_attributes": {
        "first_on_demand": 1,
        "availability": "SPOT_WITH_FALLBACK",
        "zone_id": "auto",
        "spot_bid_price_percent": 100,
        "ebs_volume_type": null,
        "ebs_volume_count": null,
        "ebs_volume_size": null
    },
    "node_type_id": "i3.2xlarge",
    "ssh_public_keys": [],
    "custom_tags": {
        "ResourceClass": "Serverless"
    },
    "spark_env_vars": {
        "PYSPARK_PYTHON": "/databricks/python3/bin/python3"
    },
    "autotermination_minutes": 0,
    "enable_elastic_disk": true,
    "cluster_source": "UI",
    "init_scripts": [],
    "data_security_mode": null,
    "runtime_engine": "STANDARD"
}&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 09:49:28 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23511#M16236</guid>
      <dc:creator>Pat</dc:creator>
      <dc:date>2022-11-09T09:49:28Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23512#M16237</link>
      <description>&lt;P&gt;Thanks Pat, &lt;/P&gt;&lt;P&gt;Yes it worked!&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1249i911F52482DB2635A/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;is there a command to show grants for a user or group?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 11:21:20 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23512#M16237</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-09T11:21:20Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23513#M16238</link>
      <description>&lt;P&gt;I think that you always need to add SECURABLE_OBJECT&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/sql/language-manual/security-show-grant.html" target="test_blank"&gt;https://docs.databricks.com/sql/language-manual/security-show-grant.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;SHOW GRANTS [ principal ] ON securable_object&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 11:41:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23513#M16238</guid>
      <dc:creator>Pat</dc:creator>
      <dc:date>2022-11-09T11:41:48Z</dc:date>
    </item>
    <item>
      <title>Re: Users are failing query data from S3 bucket</title>
      <link>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23514#M16239</link>
      <description>&lt;P&gt;Great, &lt;/P&gt;&lt;P&gt;Thank you Pat!&lt;/P&gt;</description>
      <pubDate>Wed, 09 Nov 2022 12:07:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/users-are-failing-query-data-from-s3-bucket/m-p/23514#M16239</guid>
      <dc:creator>164079</dc:creator>
      <dc:date>2022-11-09T12:07:26Z</dc:date>
    </item>
  </channel>
</rss>

