<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Issue during testing SparkSession.sql() with pytest. in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/issue-during-testing-sparksession-sql-with-pytest/m-p/50456#M28810</link>
    <description>&lt;P&gt;Dear Community,&lt;/P&gt;&lt;P&gt;I am testing PySpark code via pytest using VS Code and Databricks Connect.&lt;/P&gt;&lt;P&gt;The SparkSession is created via Databricks Connect:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;from&lt;/SPAN&gt; &lt;SPAN&gt;databricks&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;connect&lt;/SPAN&gt; &lt;SPAN&gt;import&lt;/SPAN&gt; &lt;SPAN&gt;DatabricksSession&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;spark&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; &lt;SPAN&gt;DatabricksSession&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;builder&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;getOrCreate&lt;/SPAN&gt;&lt;SPAN&gt;()&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;I receive an error message every time I call the 'SparkSession.sql()' method.&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;For example:&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;# module.py
def create_catalog(spark_session):
    """Doc string"""
    spark_session.sql("""CREATE CATALOG IF NOT EXISTS test_catalog""")

# test_module.py

from module import create_catalog

@pytest.fixture(scope="session")
def spark_session():
    """Creates SparkSession."""

    global spark
    try:
        spark
    except NameError:
        from databricks.connect import DatabricksSession
        spark = DatabricksSession.builder.getOrCreate()
    yield spark

def test_create_catalog(spark_session):
    """Doc string"""
    create_catalog(spark_session)
    &lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am receiving the following error message:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;pyspark.errors.exceptions.connect.SparkConnectGrpcException: &amp;lt;_MultiThreadedRendezvous of RPC that terminated with:
E               status = StatusCode.UNIMPLEMENTED
E               details = "Method not found: spark.connect.SparkConnectService/ReattachExecute"
E               debug_error_string = "UNKNOWN:Error received from peer  {created_time:"2023-11-04T16:14:26.2187837+00:00", grpc_status:12, grpc_message:"Method 
not found: spark.connect.SparkConnectService/ReattachExecute"}"&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;The issue also occurs when I use the SparkSession directly rather than as a fixture.&lt;/P&gt;&lt;P&gt;I have verified that SparkSession.sql(), with a session created from databricks.connect, works correctly when I am running the code via 'Run file as a Workflow on Databricks.' from VS Code.&lt;/P&gt;&lt;P&gt;Thank you in advance for any help,&lt;/P&gt;&lt;P&gt;Rafal&lt;/P&gt;</description>
    <pubDate>Sat, 04 Nov 2023 17:04:32 GMT</pubDate>
    <dc:creator>Rafal9</dc:creator>
    <dc:date>2023-11-04T17:04:32Z</dc:date>
    <item>
      <title>Issue during testing SparkSession.sql() with pytest.</title>
      <link>https://community.databricks.com/t5/data-engineering/issue-during-testing-sparksession-sql-with-pytest/m-p/50456#M28810</link>
      <description>&lt;P&gt;Dear Community,&lt;/P&gt;&lt;P&gt;I am testing PySpark code via pytest using VS Code and Databricks Connect.&lt;/P&gt;&lt;P&gt;The SparkSession is created via Databricks Connect:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;from&lt;/SPAN&gt; &lt;SPAN&gt;databricks&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;connect&lt;/SPAN&gt; &lt;SPAN&gt;import&lt;/SPAN&gt; &lt;SPAN&gt;DatabricksSession&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;spark&lt;/SPAN&gt; &lt;SPAN&gt;=&lt;/SPAN&gt; &lt;SPAN&gt;DatabricksSession&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;builder&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;getOrCreate&lt;/SPAN&gt;&lt;SPAN&gt;()&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;I receive an error message every time I call the 'SparkSession.sql()' method.&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;For example:&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;# module.py
def create_catalog(spark_session):
    """Doc string"""
    spark_session.sql("""CREATE CATALOG IF NOT EXISTS test_catalog""")

# test_module.py

from module import create_catalog

@pytest.fixture(scope="session")
def spark_session():
    """Creates SparkSession."""

    global spark
    try:
        spark
    except NameError:
        from databricks.connect import DatabricksSession
        spark = DatabricksSession.builder.getOrCreate()
    yield spark

def test_create_catalog(spark_session):
    """Doc string"""
    create_catalog(spark_session)
    &lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am receiving the following error message:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;pyspark.errors.exceptions.connect.SparkConnectGrpcException: &amp;lt;_MultiThreadedRendezvous of RPC that terminated with:
E               status = StatusCode.UNIMPLEMENTED
E               details = "Method not found: spark.connect.SparkConnectService/ReattachExecute"
E               debug_error_string = "UNKNOWN:Error received from peer  {created_time:"2023-11-04T16:14:26.2187837+00:00", grpc_status:12, grpc_message:"Method 
not found: spark.connect.SparkConnectService/ReattachExecute"}"&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;The issue also occurs when I use the SparkSession directly rather than as a fixture.&lt;/P&gt;&lt;P&gt;I have verified that SparkSession.sql(), with a session created from databricks.connect, works correctly when I am running the code via 'Run file as a Workflow on Databricks.' from VS Code.&lt;/P&gt;&lt;P&gt;Thank you in advance for any help,&lt;/P&gt;&lt;P&gt;Rafal&lt;/P&gt;</description>
      <pubDate>Sat, 04 Nov 2023 17:04:32 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/issue-during-testing-sparksession-sql-with-pytest/m-p/50456#M28810</guid>
      <dc:creator>Rafal9</dc:creator>
      <dc:date>2023-11-04T17:04:32Z</dc:date>
    </item>
  </channel>
</rss>

