<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Getting broadcast join errors in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/getting-broadcast-join-errors/m-p/22151#M15142</link>
    <description>&lt;P&gt;I would like to know how to disable broadcast join in my job to avoid this error message. Is there a Spark configuration?&lt;/P&gt;</description>
    <pubDate>Fri, 18 Jun 2021 23:23:34 GMT</pubDate>
    <dc:creator>jose_gonzalez</dc:creator>
    <dc:date>2021-06-18T23:23:34Z</dc:date>
    <item>
      <title>Getting broadcast join errors</title>
      <link>https://community.databricks.com/t5/data-engineering/getting-broadcast-join-errors/m-p/22151#M15142</link>
      <description>&lt;P&gt;I would like to know how to disable broadcast join in my job to avoid this error message. Is there a Spark configuration?&lt;/P&gt;</description>
      <pubDate>Fri, 18 Jun 2021 23:23:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/getting-broadcast-join-errors/m-p/22151#M15142</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2021-06-18T23:23:34Z</dc:date>
    </item>
    <item>
      <title>Re: Getting broadcast join errors</title>
      <link>https://community.databricks.com/t5/data-engineering/getting-broadcast-join-errors/m-p/22152#M15143</link>
      <description>&lt;P&gt;You can disable broadcast join by adding the following Spark configuration to your notebook:&lt;/P&gt;&lt;P&gt;&lt;B&gt;spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1)&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;In addition, you can also add this configuration to your cluster:&lt;/P&gt;&lt;P&gt;&lt;B&gt;spark.sql.autoBroadcastJoinThreshold -1&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;You can disable it at notebook level or cluster level.&lt;/P&gt;</description>
      <pubDate>Fri, 18 Jun 2021 23:25:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/getting-broadcast-join-errors/m-p/22152#M15143</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2021-06-18T23:25:37Z</dc:date>
    </item>
  </channel>
</rss>

