<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic how to optimize the runtime in 10.4 cluster in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10920#M5963</link>
    <description>&lt;P&gt;I am loading 1 billion records from a Spark DataFrame into a target table. On the 7.3 cluster it takes 3 hours to complete, but after migrating to the 10.4 cluster it takes 8 hours. How can I reduce the run time?&lt;/P&gt;</description>
    <pubDate>Sun, 22 Jan 2023 12:58:10 GMT</pubDate>
    <dc:creator>databicky</dc:creator>
    <dc:date>2023-01-22T12:58:10Z</dc:date>
    <item>
      <title>how to optimize the runtime in 10.4 cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10920#M5963</link>
      <description>&lt;P&gt;I am loading 1 billion records from a Spark DataFrame into a target table. On the 7.3 cluster it takes 3 hours to complete, but after migrating to the 10.4 cluster it takes 8 hours. How can I reduce the run time?&lt;/P&gt;</description>
      <pubDate>Sun, 22 Jan 2023 12:58:10 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10920#M5963</guid>
      <dc:creator>databicky</dc:creator>
      <dc:date>2023-01-22T12:58:10Z</dc:date>
    </item>
    <item>
      <title>Re: how to optimize the runtime in 10.4 cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10922#M5965</link>
      <description>&lt;P&gt;Hi @Mohammed sadamusean,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Could you provide more details on what you are doing? What type of transformations/actions are you running? What are your source and sink? Is it batch or streaming? All of that information will help.&lt;/P&gt;</description>
      <pubDate>Wed, 25 Jan 2023 01:33:35 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10922#M5965</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2023-01-25T01:33:35Z</dc:date>
    </item>
    <item>
      <title>Re: how to optimize the runtime in 10.4 cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10923#M5966</link>
      <description>&lt;P&gt;I have data in ADLS. I load this data into multiple DataFrames in a Databricks notebook, and from the final DataFrame I load the data into the final target table via a temp view of that DataFrame. It usually takes 3 hours on the 7.3 cluster, but on the 10.4 cluster it takes around 8 hours. There are 1 billion records.&lt;/P&gt;</description>
      <pubDate>Wed, 25 Jan 2023 02:32:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10923#M5966</guid>
      <dc:creator>databicky</dc:creator>
      <dc:date>2023-01-25T02:32:18Z</dc:date>
    </item>
    <item>
      <title>Re: how to optimize the runtime in 10.4 cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10924#M5967</link>
      <description>&lt;P&gt;Could you check your Spark UI to identify which stage is taking the longest, and share that information here?&lt;/P&gt;</description>
      <pubDate>Fri, 24 Feb 2023 23:40:25 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10924#M5967</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2023-02-24T23:40:25Z</dc:date>
    </item>
    <item>
      <title>Re: how to optimize the runtime in 10.4 cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10921#M5964</link>
      <description>&lt;P&gt;Hi, please refer to &lt;A href="https://docs.databricks.com/clusters/cluster-config-best-practices.html" target="test_blank"&gt;https://docs.databricks.com/clusters/cluster-config-best-practices.html&lt;/A&gt; for best practices for cluster configurations. Please let us know if this helps.&lt;/P&gt;</description>
      <pubDate>Tue, 24 Jan 2023 08:06:56 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-to-optimize-the-runtime-in-10-4-cluster/m-p/10921#M5964</guid>
      <dc:creator>Debayan</dc:creator>
      <dc:date>2023-01-24T08:06:56Z</dc:date>
    </item>
  </channel>
</rss>

