<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Pyspark installation issue in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22743#M15634</link>
    <description>&lt;P&gt;Kindly change the version from 2.4.8 to 3.2.1 when you install the Python dependencies. It should work. Thanks.&lt;/P&gt;</description>
    <pubDate>Wed, 20 Apr 2022 16:36:09 GMT</pubDate>
    <dc:creator>Aashita</dc:creator>
    <dc:date>2022-04-20T16:36:09Z</dc:date>
    <item>
      <title>Pyspark installation issue</title>
      <link>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22739#M15630</link>
      <description>&lt;P&gt;When I try to start a PySpark session in PyCharm, it throws this error: RuntimeError("Java gateway process exited before sending its port number"). Could anyone help me solve this?&lt;/P&gt;</description>
      <pubDate>Thu, 14 Apr 2022 18:25:39 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22739#M15630</guid>
      <dc:creator>_r_vind1199</dc:creator>
      <dc:date>2022-04-14T18:25:39Z</dc:date>
    </item>
    <item>
      <title>Re: Pyspark installation issue</title>
      <link>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22740#M15631</link>
      <description>&lt;P&gt;&lt;B&gt;@Aravind A&lt;/B&gt;​&amp;nbsp;&lt;B&gt;, What are the dependencies and versions you installed?&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;&lt;U&gt;Install pyspark + openjdk&lt;/U&gt;&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;%pip install pyspark==2.4.8
!apt-get install openjdk-8-jdk-headless -qq &amp;gt; /dev/null&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;&lt;U&gt;Build spark session&lt;/U&gt;&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;from pyspark.sql import SparkSession
spark = SparkSession.builder\
    .appName("Practice")\
    .getOrCreate()&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;&lt;U&gt;Note that:&lt;/U&gt;&lt;/B&gt;&lt;/P&gt;&lt;P&gt;Spark runs on Java 8/11, Scala 2.12/2.13, Python 3.6+ and R 3.5+.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Python 3.6 support is deprecated as of Spark 3.2.0.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Java 8 prior to version 8u201 support is deprecated as of Spark 3.2.0.&amp;nbsp;&lt;/P&gt;&lt;P&gt;For the Scala API, Spark 3.2.1 uses Scala 2.12. You will need to use a compatible Scala version (2.12.x).&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;A href="https://spark.apache.org/docs/latest/" alt="https://spark.apache.org/docs/latest/" target="_blank"&gt;https://spark.apache.org/docs/latest/&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 14 Apr 2022 23:31:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22740#M15631</guid>
      <dc:creator>Aashita</dc:creator>
      <dc:date>2022-04-14T23:31:37Z</dc:date>
    </item>
    <item>
      <title>Re: Pyspark installation issue</title>
      <link>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22741#M15632</link>
      <description>&lt;P&gt;@Aashita Ramteke​&amp;nbsp;, Pyspark version 3.2.1&lt;/P&gt;</description>
      <pubDate>Fri, 15 Apr 2022 13:47:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22741#M15632</guid>
      <dc:creator>_r_vind1199</dc:creator>
      <dc:date>2022-04-15T13:47:18Z</dc:date>
    </item>
    <item>
      <title>Re: Pyspark installation issue</title>
      <link>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22743#M15634</link>
      <description>&lt;P&gt;Kindly change the version from 2.4.8 to 3.2.1 when you install the Python dependencies. It should work. Thanks.&lt;/P&gt;</description>
      <pubDate>Wed, 20 Apr 2022 16:36:09 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pyspark-installation-issue/m-p/22743#M15634</guid>
      <dc:creator>Aashita</dc:creator>
      <dc:date>2022-04-20T16:36:09Z</dc:date>
    </item>
  </channel>
</rss>

