<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Getting Authentication Error while accessing Azure Blob table (wasb) URL using PySpark in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17895#M11814</link>
    <description>&lt;P&gt;Hi @Arvind Ravish​&amp;nbsp; Thanks for the response but the given config is already disabled.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;And I am able to query data from Presto but using PySpark I am getting this error.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image.png"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1788iE8AC9B25A78A9739/image-size/large?v=v2&amp;amp;px=999" role="button" title="image.png" alt="image.png" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
    <pubDate>Sun, 12 Jun 2022 07:07:59 GMT</pubDate>
    <dc:creator>vivek_sinha</dc:creator>
    <dc:date>2022-06-12T07:07:59Z</dc:date>
    <item>
      <title>Getting Authentication Error while accessing Azure Blob table (wasb) URL using PySpark</title>
      <link>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17893#M11812</link>
      <description>&lt;P&gt;I am trying to access an Azure Blob table using PySpark but am getting an authentication error. I am passing a SAS token (HTTP and HTTPS enabled), but it works only with the WASBS (HTTPS) URL, not with the WASB (HTTP) URL.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I also tried with the account key, but that didn't work either.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The other way works fine if I load the Parquet file by passing the WASB URL, but this method is very slow and takes too much time to access the data.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Please help me understand why PySpark-Azure is showing such behaviour.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We had a meeting with the Azure support team as well, but they also couldn't find any issue on their end.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;&lt;U&gt;Sample Code:&lt;/U&gt;&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;from pyspark.sql import SparkSession
&amp;nbsp;
    spark = SparkSession.builder.getOrCreate()
&amp;nbsp;
    spark.conf.set("fs.azure.sas.&amp;lt;container-name&amp;gt;.&amp;lt;storage-account&amp;gt;.blob.core.windows.net","&amp;lt;SAS Token&amp;gt;")
&amp;nbsp;&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;&lt;U&gt;Error Details:&lt;/U&gt;&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;Py4JJavaError: An error occurred while calling o146.table.
&amp;nbsp;
: java.util.concurrent.ExecutionException: org.apache.hadoop.fs.azure.AzureException: com.microsoft.azure.storage.StorageException: Cannot use HTTP with credentials that only support HTTPS.
&amp;nbsp;
    at org.sparkproject.guava.util.concurrent.AbstractFuture$Sync.getValue(AbstractFuture.java:306)
&amp;nbsp;
    at org.sparkproject.guava.util.concurrent.AbstractFuture$Sync.get(AbstractFuture.java:293)
&amp;nbsp;
    at org.sparkproject.guava.util.concurrent.AbstractFuture.get(AbstractFuture.java:116)
&amp;nbsp;
    at org.sparkproject.guava.util.concurrent.Uninterruptibles.getUninterruptibly(Uninterruptibles.java:135)
&amp;nbsp;
    at org.sparkproject.guava.cache.LocalCache$Segment.getAndRecordStats(LocalCache.java:2410)
&amp;nbsp;
    at org.sparkproject.guava.cache.LocalCache$Segment.loadSync(LocalCache.java:2380)
&amp;nbsp;
    at org.sparkproject.guava.cache.LocalCache$Segment.lockedGetOrLoad(LocalCache.java:2342)
&amp;nbsp;
    at org.sparkproject.guava.cache.LocalCache$Segment.get(LocalCache.java:2257)
&amp;nbsp;
    at org.sparkproject.guava.cache.LocalCache.get(LocalCache.java:4000)
&amp;nbsp;
    at org.sparkproject.guava.cache.LocalCache$LocalManualCache.get(LocalCache.java:4789)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.catalog.SessionCatalog.getCachedPlan(SessionCatalog.scala:155)
&amp;nbsp;
    at org.apache.spark.sql.execution.datasources.FindDataSourceTable.org$apache$spark$sql$execution$datasources$FindDataSourceTable$$readDataSourceTable(DataSourceStrategy.scala:249)
&amp;nbsp;
    at org.apache.spark.sql.execution.datasources.FindDataSourceTable$$anonfun$apply$2.applyOrElse(DataSourceStrategy.scala:288)
&amp;nbsp;
    at org.apache.spark.sql.execution.datasources.FindDataSourceTable$$anonfun$apply$2.applyOrElse(DataSourceStrategy.scala:278)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.$anonfun$resolveOperatorsDown$2(AnalysisHelper.scala:108)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.trees.CurrentOrigin$.withOrigin(TreeNode.scala:74)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.$anonfun$resolveOperatorsDown$1(AnalysisHelper.scala:108)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper$.allowInvokingTransformsInAnalyzer(AnalysisHelper.scala:221)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.resolveOperatorsDown(AnalysisHelper.scala:106)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.resolveOperatorsDown$(AnalysisHelper.scala:104)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.LogicalPlan.resolveOperatorsDown(LogicalPlan.scala:29)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.$anonfun$resolveOperatorsDown$4(AnalysisHelper.scala:113)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.trees.TreeNode.$anonfun$mapChildren$1(TreeNode.scala:408)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.trees.TreeNode.mapProductIterator(TreeNode.scala:244)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.trees.TreeNode.mapChildren(TreeNode.scala:406)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.trees.TreeNode.mapChildren(TreeNode.scala:359)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.$anonfun$resolveOperatorsDown$1(AnalysisHelper.scala:113)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper$.allowInvokingTransformsInAnalyzer(AnalysisHelper.scala:221)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.resolveOperatorsDown(AnalysisHelper.scala:106)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.resolveOperatorsDown$(AnalysisHelper.scala:104)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.LogicalPlan.resolveOperatorsDown(LogicalPlan.scala:29)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.resolveOperators(AnalysisHelper.scala:73)
&amp;nbsp;
    at org.apache.spark.sql.catalyst.plans.logical.AnalysisHelper.resolveOperators$(AnalysisHelper.scala:72)
&amp;nbsp;
    at &lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Sat, 11 Jun 2022 00:07:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17893#M11812</guid>
      <dc:creator>vivek_sinha</dc:creator>
      <dc:date>2022-06-11T00:07:26Z</dc:date>
    </item>
    <item>
      <title>Re: Getting Authentication Error while accessing Azure Blob table (wasb) URL using PySpark</title>
      <link>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17894#M11813</link>
      <description>&lt;P&gt;Based on your error, you have Secure transfer enabled on the storage account.&lt;/P&gt;&lt;P&gt;You can disable the setting below and try again with WASB/HTTP.&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.microsoft.com/en-us/azure/storage/common/storage-require-secure-transfer" target="test_blank"&gt;https://docs.microsoft.com/en-us/azure/storage/common/storage-require-secure-transfer&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1785iDCDAD3F16E882D70/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 12 Jun 2022 07:02:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17894#M11813</guid>
      <dc:creator>User16764241763</dc:creator>
      <dc:date>2022-06-12T07:02:13Z</dc:date>
    </item>
    <item>
      <title>Re: Getting Authentication Error while accessing Azure Blob table (wasb) URL using PySpark</title>
      <link>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17895#M11814</link>
      <description>&lt;P&gt;Hi @Arvind Ravish​&amp;nbsp; Thanks for the response but the given config is already disabled.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;And I am able to query data from Presto but using PySpark I am getting this error.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image.png"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1788iE8AC9B25A78A9739/image-size/large?v=v2&amp;amp;px=999" role="button" title="image.png" alt="image.png" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 12 Jun 2022 07:07:59 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17895#M11814</guid>
      <dc:creator>vivek_sinha</dc:creator>
      <dc:date>2022-06-12T07:07:59Z</dc:date>
    </item>
    <item>
      <title>Re: Getting Authentication Error while accessing Azure Blob table (wasb) URL using PySpark</title>
      <link>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17896#M11815</link>
      <description>&lt;P&gt;Hi @Arvind Ravish​&amp;nbsp; &lt;/P&gt;&lt;P&gt;The issue got fixed after passing an HTTP- and HTTPS-enabled token to the Spark executors.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks again for your help.&lt;/P&gt;</description>
      <pubDate>Sun, 12 Jun 2022 10:42:29 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/getting-authentication-error-while-accessing-azure-blob-table/m-p/17896#M11815</guid>
      <dc:creator>vivek_sinha</dc:creator>
      <dc:date>2022-06-12T10:42:29Z</dc:date>
    </item>
  </channel>
</rss>

