<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic DBR 14.1 Pyspark Join on df1[&quot;col1&quot;] = df2[&quot;col1&quot;] syntax fails in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/dbr-14-1-pyspark-join-on-df1-quot-col1-quot-df2-quot-col1-quot/m-p/51993#M1782</link>
    <description>&lt;P&gt;Hello&lt;BR /&gt;After upgrading my cluster from DBR 12 to 14.1 I got a MISSING_ATTRIBUTES.RESOLVED_ATTRIBUTE_APPEAR_IN_OPERATION on some of my Joins&lt;/P&gt;&lt;LI-CODE lang="python"&gt;df1.join(
    df2,
    [df1["name"] == df2["name"], df1["age"] == df2["age"]],
    'left_outer'
)&lt;/LI-CODE&gt;&lt;P&gt;I resolved it by changing the syntax to:&lt;/P&gt;&lt;LI-CODE lang="python"&gt;df1.alias("l").join(
    df2.alias("r"),
    [col("l.name") == col("r.name"), col("l.age") == col("r.age")],
    'left_outer'
)&lt;/LI-CODE&gt;&lt;P&gt;Is the second syntax the new standard or am I missing something with the first one ?&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
    <pubDate>Wed, 15 Nov 2023 09:12:27 GMT</pubDate>
    <dc:creator>Trifa</dc:creator>
    <dc:date>2023-11-15T09:12:27Z</dc:date>
    <item>
      <title>DBR 14.1 Pyspark Join on df1["col1"] = df2["col1"] syntax fails</title>
      <link>https://community.databricks.com/t5/get-started-discussions/dbr-14-1-pyspark-join-on-df1-quot-col1-quot-df2-quot-col1-quot/m-p/51993#M1782</link>
      <description>&lt;P&gt;Hello&lt;BR /&gt;After upgrading my cluster from DBR 12 to 14.1 I got a MISSING_ATTRIBUTES.RESOLVED_ATTRIBUTE_APPEAR_IN_OPERATION on some of my Joins&lt;/P&gt;&lt;LI-CODE lang="python"&gt;df1.join(
    df2,
    [df1["name"] == df2["name"], df1["age"] == df2["age"]],
    'left_outer'
)&lt;/LI-CODE&gt;&lt;P&gt;I resolved it by changing the syntax to:&lt;/P&gt;&lt;LI-CODE lang="python"&gt;df1.alias("l").join(
    df2.alias("r"),
    [col("l.name") == col("r.name"), col("l.age") == col("r.age")],
    'left_outer'
)&lt;/LI-CODE&gt;&lt;P&gt;Is the second syntax the new standard or am I missing something with the first one ?&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Wed, 15 Nov 2023 09:12:27 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/dbr-14-1-pyspark-join-on-df1-quot-col1-quot-df2-quot-col1-quot/m-p/51993#M1782</guid>
      <dc:creator>Trifa</dc:creator>
      <dc:date>2023-11-15T09:12:27Z</dc:date>
    </item>
  </channel>
</rss>

