<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: NVIDIA driver update in Machine Learning</title>
    <link>https://community.databricks.com/t5/machine-learning/nvidia-driver-update/m-p/49649#M2693</link>
    <description>&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;The DBR runtime compatible with the CUDA version (11.3) is DBR 11.X. Unfortunately, pyspark.ml.torch.distributed works only with DBR 13.X.&lt;/P&gt;&lt;P&gt;So going back to DBR 11.X does not solve the problem.&lt;/P&gt;</description>
    <pubDate>Sat, 21 Oct 2023 04:06:13 GMT</pubDate>
    <dc:creator>ravi-kolluri_in</dc:creator>
    <dc:date>2023-10-21T04:06:13Z</dc:date>
    <item>
      <title>NVIDIA driver update</title>
      <link>https://community.databricks.com/t5/machine-learning/nvidia-driver-update/m-p/49543#M2687</link>
      <description>&lt;P&gt;I want to update the cuda driver for the NVIDIA tesla T4 GPU on the cluster.&amp;nbsp;&lt;/P&gt;&lt;P&gt;using the following command&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;%&lt;/SPAN&gt;&lt;SPAN&gt;sh&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt;&lt;SPAN&gt; apt-get &lt;/SPAN&gt;&lt;SPAN&gt;--purge&lt;/SPAN&gt;&lt;SPAN&gt; remove &lt;/SPAN&gt;&lt;SPAN&gt;"*nvidia*"&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt;&lt;SPAN&gt; /usr/bin/nvidia-uninstall&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;wget&lt;/SPAN&gt;&lt;SPAN&gt; &lt;A href="https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-ubuntu2204.pin" target="_blank"&gt;https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-ubuntu2204.pin&lt;/A&gt;&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt; &lt;SPAN&gt;mv&lt;/SPAN&gt;&lt;SPAN&gt; cuda-ubuntu2204.pin /etc/apt/preferences.d/cuda-repository-pin-600&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;wget&lt;/SPAN&gt;&lt;SPAN&gt; &lt;A href="https://developer.download.nvidia.com/compute/cuda/11.8.0/local_installers/cuda-repo-ubuntu2204-11-8-local_11.8.0-520.61.05-1_amd64.deb" target="_blank"&gt;https://developer.download.nvidia.com/compute/cuda/11.8.0/local_installers/cuda-repo-ubuntu2204-11-8-local_11.8.0-520.61.05-1_amd64.deb&lt;/A&gt;&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt;&lt;SPAN&gt; dpkg &lt;/SPAN&gt;&lt;SPAN&gt;-i&lt;/SPAN&gt;&lt;SPAN&gt; 
cuda-repo-ubuntu2204-11-8-local_11.&lt;/SPAN&gt;&lt;SPAN&gt;8.0&lt;/SPAN&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt;520.61&lt;/SPAN&gt;&lt;SPAN&gt;.&lt;/SPAN&gt;&lt;SPAN&gt;05&lt;/SPAN&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt;1&lt;/SPAN&gt;&lt;SPAN&gt;_amd64.deb&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt; &lt;SPAN&gt;cp&lt;/SPAN&gt;&lt;SPAN&gt; /var/cuda-repo-ubuntu2204-11-8-local/cuda-*-keyring.gpg /usr/share/keyrings/&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt;&lt;SPAN&gt; apt-get update&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;sudo&lt;/SPAN&gt;&lt;SPAN&gt; apt-get &lt;/SPAN&gt;&lt;SPAN&gt;-y&lt;/SPAN&gt;&lt;SPAN&gt; install cuda&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;It is stuck without returning any result.&amp;nbsp;&lt;/SPAN&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;Please help.&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
      <pubDate>Thu, 19 Oct 2023 17:44:12 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/nvidia-driver-update/m-p/49543#M2687</guid>
      <dc:creator>ravi-kolluri_in</dc:creator>
      <dc:date>2023-10-19T17:44:12Z</dc:date>
    </item>
    <item>
      <title>Re: NVIDIA driver update</title>
      <link>https://community.databricks.com/t5/machine-learning/nvidia-driver-update/m-p/49649#M2693</link>
      <description>&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;The DBR runtime compatible with the CUDA version (11.3) is DBR 11.X. Unfortunately, pyspark.ml.torch.distributed works only with DBR 13.X.&lt;/P&gt;&lt;P&gt;So going back to DBR 11.X does not solve the problem.&lt;/P&gt;</description>
      <pubDate>Sat, 21 Oct 2023 04:06:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/nvidia-driver-update/m-p/49649#M2693</guid>
      <dc:creator>ravi-kolluri_in</dc:creator>
      <dc:date>2023-10-21T04:06:13Z</dc:date>
    </item>
  </channel>
</rss>

