<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic How to resolve our of memory error? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-resolve-our-of-memory-error/m-p/22854#M15734</link>
    <description>&lt;P&gt;Hi, I am working as azure support engineer&lt;/P&gt;&lt;P&gt;I found this error while I am checking the pipeline failure, and showing below error&lt;/P&gt;&lt;P&gt;"org.apache.spark.SparkException: Job aborted due to stage failure: Task 0 in stage 72403.0 failed 4 times, most recent failure: Lost task 0.3 in stage 72403.0 (TID 801507, 10.139.64.5, executor 169):&lt;B&gt; org.apache.spark.memory.SparkOutOfMemoryError: Unable to acquire 65536 bytes of memory, got 0"&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Py4JJavaError                             Traceback (most recent call last)&lt;/P&gt;&lt;P&gt;&amp;lt;command-2313153849666105&amp;gt; in create_destination(location)&lt;/P&gt;&lt;P&gt;    154           try:&lt;/P&gt;&lt;P&gt;--&amp;gt; 155               sql_df = spark.sql(sql_query)&lt;/P&gt;&lt;P&gt;    156               break&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;/databricks/spark/python/pyspark/sql/session.py in sql(self, sqlQuery)&lt;/P&gt;&lt;P&gt;    708         """&lt;/P&gt;&lt;P&gt;--&amp;gt; 709         return DataFrame(self._jsparkSession.sql(sqlQuery), self._wrapped)&lt;/P&gt;&lt;P&gt;    710 &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;/databricks/spark/python/lib/py4j-0.10.9-src.zip/py4j/java_gateway.py in __call__(self, *args)&lt;/P&gt;&lt;P&gt;   1304         return_value = get_return_value(&lt;/P&gt;&lt;P&gt;-&amp;gt; 1305             answer, self.gateway_client, self.target_id, self.name)&lt;/P&gt;&lt;P&gt;   1306 &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;org.apache.spark.memory.TaskMemoryManager.allocatePage(TaskMemoryManager.java:289)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.memory.MemoryConsumer.allocatePage(MemoryConsumer.java:116)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.util.collection.unsafe.sort.UnsafeExternalSorter.acquireNewPageIfNecessary(UnsafeExternalSorter.java:419)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.util.collection.unsafe.sort.UnsafeExternalSorter.insertRecord(UnsafeExternalSorter.java:443)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.UnsafeExternalRowSorter.insertRow(UnsafeExternalRowSorter.java:138)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.UnsafeExternalRowSorter.sort(UnsafeExternalRowSorter.java:241)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.SortExec$$anon$2.sortedIterator(SortExec.scala:133)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.SortExec$$anon$2.hasNext(SortExec.scala:147)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec$$anon$1.fetchNextRow(WindowExec.scala:185)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec$$anon$1.&amp;lt;init&amp;gt;(WindowExec.scala:194)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec.$anonfun$doExecute$3(WindowExec.scala:168)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec.$anonfun$doExecute$3$adapted(WindowExec.scala:167)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.$anonfun$mapPartitionsWithIndexInternal$2(RDD.scala:866)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.$anonfun$mapPartitionsWithIndexInternal$2$adapted(RDD.scala:866)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:60)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:356)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.iterator(RDD.scala:320)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:60)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:356)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.iterator(RDD.scala:320)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:60)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:356)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.$anonfun$getOrCompute$1(RDD.scala:369)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.BlockManager.$anonfun$doPutIterator$6(BlockManager.scala:1414)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.BlockManager.$anonfun$doPutIterator$6$adapted(BlockManager.scala:1412)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.DiskStore.put(DiskStore.scala:70)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.BlockManager.$anonfun$doPutIterator$1(BlockManager.scala:1412)&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
    <pubDate>Thu, 10 Nov 2022 09:14:30 GMT</pubDate>
    <dc:creator>Bujji</dc:creator>
    <dc:date>2022-11-10T09:14:30Z</dc:date>
    <item>
      <title>How to resolve our of memory error?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-resolve-our-of-memory-error/m-p/22854#M15734</link>
      <description>&lt;P&gt;Hi, I am working as azure support engineer&lt;/P&gt;&lt;P&gt;I found this error while I am checking the pipeline failure, and showing below error&lt;/P&gt;&lt;P&gt;"org.apache.spark.SparkException: Job aborted due to stage failure: Task 0 in stage 72403.0 failed 4 times, most recent failure: Lost task 0.3 in stage 72403.0 (TID 801507, 10.139.64.5, executor 169):&lt;B&gt; org.apache.spark.memory.SparkOutOfMemoryError: Unable to acquire 65536 bytes of memory, got 0"&lt;/B&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Py4JJavaError                             Traceback (most recent call last)&lt;/P&gt;&lt;P&gt;&amp;lt;command-2313153849666105&amp;gt; in create_destination(location)&lt;/P&gt;&lt;P&gt;    154           try:&lt;/P&gt;&lt;P&gt;--&amp;gt; 155               sql_df = spark.sql(sql_query)&lt;/P&gt;&lt;P&gt;    156               break&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;/databricks/spark/python/pyspark/sql/session.py in sql(self, sqlQuery)&lt;/P&gt;&lt;P&gt;    708         """&lt;/P&gt;&lt;P&gt;--&amp;gt; 709         return DataFrame(self._jsparkSession.sql(sqlQuery), self._wrapped)&lt;/P&gt;&lt;P&gt;    710 &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;/databricks/spark/python/lib/py4j-0.10.9-src.zip/py4j/java_gateway.py in __call__(self, *args)&lt;/P&gt;&lt;P&gt;   1304         return_value = get_return_value(&lt;/P&gt;&lt;P&gt;-&amp;gt; 1305             answer, self.gateway_client, self.target_id, self.name)&lt;/P&gt;&lt;P&gt;   1306 &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;org.apache.spark.memory.TaskMemoryManager.allocatePage(TaskMemoryManager.java:289)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.memory.MemoryConsumer.allocatePage(MemoryConsumer.java:116)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.util.collection.unsafe.sort.UnsafeExternalSorter.acquireNewPageIfNecessary(UnsafeExternalSorter.java:419)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.util.collection.unsafe.sort.UnsafeExternalSorter.insertRecord(UnsafeExternalSorter.java:443)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.UnsafeExternalRowSorter.insertRow(UnsafeExternalRowSorter.java:138)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.UnsafeExternalRowSorter.sort(UnsafeExternalRowSorter.java:241)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.SortExec$$anon$2.sortedIterator(SortExec.scala:133)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.SortExec$$anon$2.hasNext(SortExec.scala:147)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec$$anon$1.fetchNextRow(WindowExec.scala:185)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec$$anon$1.&amp;lt;init&amp;gt;(WindowExec.scala:194)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec.$anonfun$doExecute$3(WindowExec.scala:168)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.sql.execution.window.WindowExec.$anonfun$doExecute$3$adapted(WindowExec.scala:167)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.$anonfun$mapPartitionsWithIndexInternal$2(RDD.scala:866)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.$anonfun$mapPartitionsWithIndexInternal$2$adapted(RDD.scala:866)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:60)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:356)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.iterator(RDD.scala:320)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:60)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:356)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.iterator(RDD.scala:320)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.MapPartitionsRDD.compute(MapPartitionsRDD.scala:60)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.computeOrReadCheckpoint(RDD.scala:356)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.rdd.RDD.$anonfun$getOrCompute$1(RDD.scala:369)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.BlockManager.$anonfun$doPutIterator$6(BlockManager.scala:1414)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.BlockManager.$anonfun$doPutIterator$6$adapted(BlockManager.scala:1412)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.DiskStore.put(DiskStore.scala:70)&lt;/P&gt;&lt;P&gt;	at org.apache.spark.storage.BlockManager.$anonfun$doPutIterator$1(BlockManager.scala:1412)&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 10 Nov 2022 09:14:30 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-resolve-our-of-memory-error/m-p/22854#M15734</guid>
      <dc:creator>Bujji</dc:creator>
      <dc:date>2022-11-10T09:14:30Z</dc:date>
    </item>
    <item>
      <title>Re: How to resolve our of memory error?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-resolve-our-of-memory-error/m-p/22855#M15735</link>
      <description>&lt;P&gt;Hi @mahesh bmk​&amp;nbsp;,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;It would be nice to see the sql_query.&lt;/P&gt;&lt;P&gt;is there some window function used? You might try to run this on bigger cluster.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 10 Nov 2022 09:55:58 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-resolve-our-of-memory-error/m-p/22855#M15735</guid>
      <dc:creator>Pat</dc:creator>
      <dc:date>2022-11-10T09:55:58Z</dc:date>
    </item>
  </channel>
</rss>

