<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: how to Intercept Spark Listener with Pyspark ? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31313#M22795</link>
    <description>&lt;P&gt;Hi again! Thank you for your new question! As usual, we'll let your peers have a chance to answer first. Thanks for your patience!&lt;/P&gt;</description>
    <pubDate>Thu, 20 Jan 2022 16:30:20 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2022-01-20T16:30:20Z</dc:date>
    <item>
      <title>how to Intercept Spark Listener with Pyspark ?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31312#M22794</link>
      <description>&lt;P&gt;Hi guys,&lt;/P&gt;&lt;P&gt;&#8203;&lt;/P&gt;&lt;P&gt;Is it possible to intercept the Spark Listener with PySpark to collect indicators like shuffle, skew ratio, etc.?&lt;/P&gt;</description>
      <pubDate>Wed, 19 Jan 2022 20:12:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31312#M22794</guid>
      <dc:creator>William_Scardua</dc:creator>
      <dc:date>2022-01-19T20:12:37Z</dc:date>
    </item>
    <item>
      <title>Re: how to Intercept Spark Listener with Pyspark ?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31313#M22795</link>
      <description>&lt;P&gt;Hi again! Thank you for your new question! As usual, we'll let your peers have a chance to answer first. Thanks for your patience!&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 16:30:20 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31313#M22795</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-01-20T16:30:20Z</dc:date>
    </item>
    <item>
      <title>Re: how to Intercept Spark Listener with Pyspark ?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31314#M22796</link>
      <description>&lt;P&gt;Interesting question.&lt;/P&gt;&lt;P&gt;I know that you can use the SparkListener to collect info, e.g. &lt;A href="https://medium.com/analytics-vidhya/better-spark-logging-and-monitoring-with-spark-listener-c2c5fe86547a" alt="https://medium.com/analytics-vidhya/better-spark-logging-and-monitoring-with-spark-listener-c2c5fe86547a" target="_blank"&gt;here&lt;/A&gt;.&lt;/P&gt;&lt;P&gt;Mind that the class is written in Scala, so my first thought was that it is not possible in Python/PySpark.&lt;/P&gt;&lt;P&gt;But &lt;A href="https://stackoverflow.com/questions/44082957/how-to-add-a-sparklistener-from-pyspark-in-python" alt="https://stackoverflow.com/questions/44082957/how-to-add-a-sparklistener-from-pyspark-in-python" target="_blank"&gt;SO says it is possible, but with a lot of overhead tbh&lt;/A&gt;.&lt;/P&gt;&lt;P&gt;So it is far from optimal; I'd try to use Scala instead.&lt;/P&gt;</description>
      <pubDate>Fri, 21 Jan 2022 15:04:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-intercept-spark-listener-with-pyspark/m-p/31314#M22796</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2022-01-21T15:04:02Z</dc:date>
    </item>
  </channel>
</rss>

