<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Databricks-connect VSCode debugging pandas_api not working in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/databricks-connect-vscode-debugging-pandas-api-not-working/m-p/38006#M26539</link>
    <description>&lt;P&gt;Hi&lt;/P&gt;&lt;P&gt;I am using the databricks extension on VSCode and have been running into an issue for the past two days; before that it worked fine. I receive an error when I try to use Pandas-on-Spark during debugging.&lt;/P&gt;&lt;LI-CODE lang="python"&gt;from databricks.connect import DatabricksSession
spark = DatabricksSession.builder.getOrCreate()

df = spark.sql('select 1')
print(df.count()) # ---&amp;gt; printing 1

df.pandas_api().describe()&lt;/LI-CODE&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="FabriceDeseyn_0-1689838667900.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/2900i188560449F0F9089/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="FabriceDeseyn_0-1689838667900.png" alt="FabriceDeseyn_0-1689838667900.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;If I look deeper it seems that SPARK_REMOTE was not set and therefore the error is thrown.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="FabriceDeseyn_1-1689838868477.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/2901i497008B2D28CDCDE/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="FabriceDeseyn_1-1689838868477.png" alt="FabriceDeseyn_1-1689838868477.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Can anyone pinpoint what I did wrong?&lt;BR /&gt;I have already tried the following steps:&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;reinstall databricks-connect&lt;/LI&gt;&lt;LI&gt;reinstall extension&lt;/LI&gt;&lt;LI&gt;other cluster&lt;/LI&gt;&lt;LI&gt;other cluster with DBR 13.1 (and corresponding databricks-connect)&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Thu, 20 Jul 2023 07:42:56 GMT</pubDate>
    <dc:creator>FabriceDeseyn</dc:creator>
    <dc:date>2023-07-20T07:42:56Z</dc:date>
    <item>
      <title>Databricks-connect VSCode debugging pandas_api not working</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-connect-vscode-debugging-pandas-api-not-working/m-p/38006#M26539</link>
      <description>&lt;P&gt;Hi&lt;/P&gt;&lt;P&gt;I am using the databricks extension on VSCode and have been running into an issue for the past two days; before that it worked fine. I receive an error when I try to use Pandas-on-Spark during debugging.&lt;/P&gt;&lt;LI-CODE lang="python"&gt;from databricks.connect import DatabricksSession
spark = DatabricksSession.builder.getOrCreate()

df = spark.sql('select 1')
print(df.count()) # ---&amp;gt; printing 1

df.pandas_api().describe()&lt;/LI-CODE&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="FabriceDeseyn_0-1689838667900.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/2900i188560449F0F9089/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="FabriceDeseyn_0-1689838667900.png" alt="FabriceDeseyn_0-1689838667900.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;If I look deeper it seems that SPARK_REMOTE was not set and therefore the error is thrown.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="FabriceDeseyn_1-1689838868477.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/2901i497008B2D28CDCDE/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="FabriceDeseyn_1-1689838868477.png" alt="FabriceDeseyn_1-1689838868477.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Can anyone pinpoint what I did wrong?&lt;BR /&gt;I have already tried the following steps:&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;reinstall databricks-connect&lt;/LI&gt;&lt;LI&gt;reinstall extension&lt;/LI&gt;&lt;LI&gt;other cluster&lt;/LI&gt;&lt;LI&gt;other cluster with DBR 13.1 (and corresponding databricks-connect)&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jul 2023 07:42:56 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-connect-vscode-debugging-pandas-api-not-working/m-p/38006#M26539</guid>
      <dc:creator>FabriceDeseyn</dc:creator>
      <dc:date>2023-07-20T07:42:56Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks-connect VSCode debugging pandas_api not working</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-connect-vscode-debugging-pandas-api-not-working/m-p/38762#M26747</link>
      <description>&lt;P&gt;Additional info:&lt;BR /&gt;It seems that the issue comes from the 1.1.0 version of the databricks extension in VSCode.&lt;BR /&gt;Downgrading to 1.0.0 solves my issue.&lt;/P&gt;</description>
      <pubDate>Mon, 31 Jul 2023 08:28:28 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-connect-vscode-debugging-pandas-api-not-working/m-p/38762#M26747</guid>
      <dc:creator>FabriceDeseyn</dc:creator>
      <dc:date>2023-07-31T08:28:28Z</dc:date>
    </item>
  </channel>
</rss>

