<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: AnalysisException: [ErrorClass=INVALID_PARAMETER_VALUE] Missing cloud file system scheme in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/analysisexception-errorclass-invalid-parameter-value-missing/m-p/43283#M27499</link>
    <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;Thanks for your response. I didn't provide a cloud file system scheme in the path while creating the table using the DataFrame API, but I was still able to create the table.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;%python
# File location and type
file_location = "/mnt/training/ecommerce/users/users.parquet"
file_type = "parquet"

df = spark.read.format(file_type) \
  .load(file_location)

display(df)

temp_table_name = "test_catalog.test_schema.users"
df.createOrReplaceTempView(temp_table_name)&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;When I provided the scheme in SQL, I got the following error:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;%sql
CREATE TABLE IF NOT EXISTS events USING parquet OPTIONS (path "s3://mnt/training/ecommerce/events/events.parquet");

AnalysisException: No parent external location found for path 's3://mnt/training/ecommerce/events/events.parquet'&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Sun, 03 Sep 2023 15:08:42 GMT</pubDate>
    <dc:creator>Madison</dc:creator>
    <dc:date>2023-09-03T15:08:42Z</dc:date>
    <item>
      <title>AnalysisException: [ErrorClass=INVALID_PARAMETER_VALUE] Missing cloud file system scheme</title>
      <link>https://community.databricks.com/t5/data-engineering/analysisexception-errorclass-invalid-parameter-value-missing/m-p/43045#M27474</link>
      <description>&lt;P&gt;I am trying to follow along with the Apache Spark Programming training module, where the instructor creates an events table from a Parquet file like this:&lt;/P&gt;&lt;LI-CODE lang="python"&gt;%sql
CREATE TABLE IF NOT EXISTS events USING parquet OPTIONS (path "/mnt/training/ecommerce/events/events.parquet");&lt;/LI-CODE&gt;&lt;P&gt;When I tried to run the above command, I got the following error message:&lt;/P&gt;&lt;LI-CODE lang="python"&gt;AnalysisException: [RequestId=... ErrorClass=INVALID_PARAMETER_VALUE] Missing cloud file system scheme
---------------------------------------------------------------------------
AnalysisException                         Traceback (most recent call last)
&amp;lt;command-644583705732552&amp;gt; in &amp;lt;cell line: 1&amp;gt;()
      5     display(df)
      6     return df
----&amp;gt; 7   _sqldf = ____databricks_percent_sql()
      8 finally:
      9   del ____databricks_percent_sql

&amp;lt;command-644583705732552&amp;gt; in ____databricks_percent_sql()
      2   def ____databricks_percent_sql():
      3     import base64
----&amp;gt; 4     df = spark.sql(base64.standard_b64decode("...=").decode())
      5     display(df)
      6     return df

/databricks/spark/python/pyspark/instrumentation_utils.py in wrapper(*args, **kwargs)
     46             start = time.perf_counter()
     47             try:
---&amp;gt; 48                 res = func(*args, **kwargs)&lt;/LI-CODE&gt;</description>
      <pubDate>Fri, 01 Sep 2023 07:54:28 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/analysisexception-errorclass-invalid-parameter-value-missing/m-p/43045#M27474</guid>
      <dc:creator>Madison</dc:creator>
      <dc:date>2023-09-01T07:54:28Z</dc:date>
    </item>
    <item>
      <title>Re: AnalysisException: [ErrorClass=INVALID_PARAMETER_VALUE] Missing cloud file system scheme</title>
      <link>https://community.databricks.com/t5/data-engineering/analysisexception-errorclass-invalid-parameter-value-missing/m-p/43283#M27499</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;Thanks for your response. I didn't provide a cloud file system scheme in the path while creating the table using the DataFrame API, but I was still able to create the table.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;%python
# File location and type
file_location = "/mnt/training/ecommerce/users/users.parquet"
file_type = "parquet"

df = spark.read.format(file_type) \
  .load(file_location)

display(df)

temp_table_name = "test_catalog.test_schema.users"
df.createOrReplaceTempView(temp_table_name)&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;When I provided the scheme in SQL, I got the following error:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;%sql
CREATE TABLE IF NOT EXISTS events USING parquet OPTIONS (path "s3://mnt/training/ecommerce/events/events.parquet");

AnalysisException: No parent external location found for path 's3://mnt/training/ecommerce/events/events.parquet'&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 03 Sep 2023 15:08:42 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/analysisexception-errorclass-invalid-parameter-value-missing/m-p/43283#M27499</guid>
      <dc:creator>Madison</dc:creator>
      <dc:date>2023-09-03T15:08:42Z</dc:date>
    </item>
  </channel>
</rss>

