<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16905#M11000</link>
    <description>&lt;P&gt;Please extend the number of dataframe partitions using &amp;nbsp;&lt;/P&gt;&lt;P&gt;coalesce(&amp;lt;N&amp;gt;) or&amp;nbsp;repartition(&amp;lt;N&amp;gt;). In most cases, it should solve the issue automatically as it will write in chunks per partition.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;In addition, these JDBC connection properties can help (as on &lt;A href="https://spark.apache.org/docs/latest/sql-data-sources-jdbc.html" alt="https://spark.apache.org/docs/latest/sql-data-sources-jdbc.html" target="_blank"&gt;JDBC To Other Databases - Spark 3.3.0 Documentation (apache.org)&lt;/A&gt;):&lt;/P&gt;&lt;P&gt;numPartitions&lt;/P&gt;&lt;P&gt;batchsize&lt;/P&gt;&lt;P&gt;isolationLevel&lt;/P&gt;</description>
    <pubDate>Wed, 22 Jun 2022 16:37:46 GMT</pubDate>
    <dc:creator>Hubert-Dudek</dc:creator>
    <dc:date>2022-06-22T16:37:46Z</dc:date>
    <item>
      <title>Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection</title>
      <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16904#M10999</link>
      <description>&lt;P&gt;&lt;B&gt;I am working on writing a large amount of data from Databricks to an external SQL server using a JDBC connection. I keep getting timeout errors/connection lost but digging deeper it appears to be a memory problem. I am wondering what cluster configurations I may need/where would be best to cache my data. The input data is about 60 GB of data that is reduced to 60 mil rows. The process works to write about 1 million rows to the external database then crashes.&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;I have tried different cluster configurations, memory optimized, compute optimized etc. I have also tried different garbage collection settings as the garbage collection metric is dark red during the process. &lt;/B&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 22 Jun 2022 15:50:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16904#M10999</guid>
      <dc:creator>Megan05</dc:creator>
      <dc:date>2022-06-22T15:50:23Z</dc:date>
    </item>
    <item>
      <title>Re: Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection</title>
      <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16905#M11000</link>
      <description>&lt;P&gt;Please extend the number of dataframe partitions using &amp;nbsp;&lt;/P&gt;&lt;P&gt;coalesce(&amp;lt;N&amp;gt;) or&amp;nbsp;repartition(&amp;lt;N&amp;gt;). In most cases, it should solve the issue automatically as it will write in chunks per partition.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;In addition, these JDBC connection properties can help (as on &lt;A href="https://spark.apache.org/docs/latest/sql-data-sources-jdbc.html" alt="https://spark.apache.org/docs/latest/sql-data-sources-jdbc.html" target="_blank"&gt;JDBC To Other Databases - Spark 3.3.0 Documentation (apache.org)&lt;/A&gt;):&lt;/P&gt;&lt;P&gt;numPartitions&lt;/P&gt;&lt;P&gt;batchsize&lt;/P&gt;&lt;P&gt;isolationLevel&lt;/P&gt;</description>
      <pubDate>Wed, 22 Jun 2022 16:37:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16905#M11000</guid>
      <dc:creator>Hubert-Dudek</dc:creator>
      <dc:date>2022-06-22T16:37:46Z</dc:date>
    </item>
    <item>
      <title>Re: Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection</title>
      <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16906#M11001</link>
      <description>&lt;P&gt;Thanks for your response, Hubert! That seemed to work to fix the timeout issue.&lt;/P&gt;</description>
      <pubDate>Wed, 22 Jun 2022 22:41:04 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16906#M11001</guid>
      <dc:creator>Megan05</dc:creator>
      <dc:date>2022-06-22T22:41:04Z</dc:date>
    </item>
    <item>
      <title>Re: Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection</title>
      <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16907#M11002</link>
      <description>&lt;P&gt;Thanks for the answer. I am also getting this problem. &lt;/P&gt;&lt;P&gt;&lt;A href="https://hotrabatte.com/" alt="https://hotrabatte.com/" target="_blank"&gt;Hotrabatt&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 23 Jun 2022 09:42:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16907#M11002</guid>
      <dc:creator>hotrabattecom</dc:creator>
      <dc:date>2022-06-23T09:42:18Z</dc:date>
    </item>
    <item>
      <title>Re: Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection</title>
      <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16908#M11003</link>
      <description>&lt;P&gt;Great to hear. If it is possible, please select my answer as the best one.&lt;/P&gt;</description>
      <pubDate>Thu, 23 Jun 2022 18:46:09 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/16908#M11003</guid>
      <dc:creator>Hubert-Dudek</dc:creator>
      <dc:date>2022-06-23T18:46:09Z</dc:date>
    </item>
    <item>
      <title>Re: Out of Memory/Connection Lost When Writing to External SQL Server from Databricks Using JDBC Connection</title>
      <link>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/83022#M36812</link>
      <description>&lt;P&gt;Excuse me Megan05, what parameters did you use?&lt;/P&gt;</description>
      <pubDate>Wed, 14 Aug 2024 21:14:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/out-of-memory-connection-lost-when-writing-to-external-sql/m-p/83022#M36812</guid>
      <dc:creator>PabloCSD</dc:creator>
      <dc:date>2024-08-14T21:14:26Z</dc:date>
    </item>
  </channel>
</rss>

