<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Workaround for GraphFrames not working on Delta Live Table? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20190#M13616</link>
    <description>&lt;P&gt;According to &lt;A href="https://docs.databricks.com/release-notes/runtime/11.0ml.html" alt="https://docs.databricks.com/release-notes/runtime/11.0ml.html" target="_blank"&gt;this&lt;/A&gt; page, the GraphFrames package is included in the databricks runtime since at least 11.0. However trying to run a connected components algorithm inside a delta live table notebook yields the error java.lang.ClassNotFoundException: org.graphframes.GraphFramePythonAPI &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I installed with pip using a magic command, but it seems that the package  is not included in the cluster itself. Is there a workaround to get graphframes working on the delta live runtime? I tried adding the maven coordinates in the cluster definition but it seems DLT does not support maven libraries.&lt;/P&gt;</description>
    <pubDate>Tue, 29 Nov 2022 01:22:56 GMT</pubDate>
    <dc:creator>amartinez</dc:creator>
    <dc:date>2022-11-29T01:22:56Z</dc:date>
    <item>
      <title>Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20190#M13616</link>
      <description>&lt;P&gt;According to &lt;A href="https://docs.databricks.com/release-notes/runtime/11.0ml.html" alt="https://docs.databricks.com/release-notes/runtime/11.0ml.html" target="_blank"&gt;this&lt;/A&gt; page, the GraphFrames package is included in the databricks runtime since at least 11.0. However trying to run a connected components algorithm inside a delta live table notebook yields the error java.lang.ClassNotFoundException: org.graphframes.GraphFramePythonAPI &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I installed with pip using a magic command, but it seems that the package  is not included in the cluster itself. Is there a workaround to get graphframes working on the delta live runtime? I tried adding the maven coordinates in the cluster definition but it seems DLT does not support maven libraries.&lt;/P&gt;</description>
      <pubDate>Tue, 29 Nov 2022 01:22:56 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20190#M13616</guid>
      <dc:creator>amartinez</dc:creator>
      <dc:date>2022-11-29T01:22:56Z</dc:date>
    </item>
    <item>
      <title>Re: Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20191#M13617</link>
      <description>&lt;P&gt;have you tried an ML cluster?   I think that is the key.&lt;/P&gt;</description>
      <pubDate>Tue, 29 Nov 2022 08:44:59 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20191#M13617</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2022-11-29T08:44:59Z</dc:date>
    </item>
    <item>
      <title>Re: Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20192#M13618</link>
      <description>&lt;P&gt;How would I specify that I want a ML cluster? According to the Delta Live Table documentation I should not specify a runtime version....&lt;/P&gt;</description>
      <pubDate>Tue, 29 Nov 2022 15:53:54 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20192#M13618</guid>
      <dc:creator>amartinez</dc:creator>
      <dc:date>2022-11-29T15:53:54Z</dc:date>
    </item>
    <item>
      <title>Re: Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20193#M13619</link>
      <description>&lt;P&gt;the doc you mention is specifically for the machine learning runtime.&lt;/P&gt;&lt;P&gt;DLT does not use that runtime and, as you correctly asked, you cannot define a runtime for DLT. So my previous answer is not an option. Sorry about that.&lt;/P&gt;&lt;P&gt;Right now, the only way to install libs is by using pip. &lt;/P&gt;&lt;P&gt;According to &lt;A href="https://docs.databricks.com/workflows/delta-live-tables/delta-live-tables-python-ref.html#python-libraries" alt="https://docs.databricks.com/workflows/delta-live-tables/delta-live-tables-python-ref.html#python-libraries" target="_blank"&gt;this doc&lt;/A&gt; pip should work.&lt;/P&gt;&lt;P&gt;But as DLT is still pretty new, it is possible that graphframes is not yet supported.&lt;/P&gt;</description>
      <pubDate>Tue, 29 Nov 2022 16:06:56 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20193#M13619</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2022-11-29T16:06:56Z</dc:date>
    </item>
    <item>
      <title>Re: Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20194#M13620</link>
      <description>&lt;P&gt;DLT is specifically built for Data Engineering work as of now&lt;/P&gt;</description>
      <pubDate>Wed, 30 Nov 2022 13:10:33 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20194#M13620</guid>
      <dc:creator>Senthil1</dc:creator>
      <dc:date>2022-11-30T13:10:33Z</dc:date>
    </item>
    <item>
      <title>Re: Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20195#M13621</link>
      <description>&lt;P&gt;use MLFlow for tracking, monitoring with ML cluster for now&lt;/P&gt;</description>
      <pubDate>Wed, 30 Nov 2022 13:12:00 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/20195#M13621</guid>
      <dc:creator>Senthil1</dc:creator>
      <dc:date>2022-11-30T13:12:00Z</dc:date>
    </item>
    <item>
      <title>Re: Workaround for GraphFrames not working on Delta Live Table?</title>
      <link>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/76113#M35151</link>
      <description>&lt;P&gt;I'm also trying to use GraphFrames inside a DLT pipeline.&amp;nbsp; &amp;nbsp;I get an error that graphframes is not installed in the cluster.&amp;nbsp; &amp;nbsp;I'm using it successfully in test notebooks using the ML version of the cluster.&amp;nbsp; Is there a way to use this inside a DLT job?&lt;/P&gt;</description>
      <pubDate>Fri, 28 Jun 2024 15:35:19 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/workaround-for-graphframes-not-working-on-delta-live-table/m-p/76113#M35151</guid>
      <dc:creator>lprevost</dc:creator>
      <dc:date>2024-06-28T15:35:19Z</dc:date>
    </item>
  </channel>
</rss>

