<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic What are Best Practices for Spark streaming in Databricks in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24698#M17188</link>
    <description>&lt;P&gt;What are best practices for Spark streaming in Databricks?&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Is it a good idea to consume multiple topics in one streaming job?&lt;/LI&gt;&lt;LI&gt;Is auto scaling recommended for Spark streaming?&lt;/LI&gt;&lt;LI&gt;How many worker nodes should we choose for a streaming job?&lt;/LI&gt;&lt;LI&gt;When should we run OPTIMIZE for continuously streaming topics?&lt;/LI&gt;&lt;LI&gt;Are there any other things to consider when implementing streaming jobs with high throughput?&lt;/LI&gt;&lt;/OL&gt;</description>
    <pubDate>Mon, 14 Jun 2021 22:15:21 GMT</pubDate>
    <dc:creator>Srikanth_Gupta_</dc:creator>
    <dc:date>2021-06-14T22:15:21Z</dc:date>
    <item>
      <title>What are Best Practices for Spark streaming in Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24698#M17188</link>
      <description>&lt;P&gt;What are best practices for Spark streaming in Databricks?&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Is it a good idea to consume multiple topics in one streaming job?&lt;/LI&gt;&lt;LI&gt;Is auto scaling recommended for Spark streaming?&lt;/LI&gt;&lt;LI&gt;How many worker nodes should we choose for a streaming job?&lt;/LI&gt;&lt;LI&gt;When should we run OPTIMIZE for continuously streaming topics?&lt;/LI&gt;&lt;LI&gt;Are there any other things to consider when implementing streaming jobs with high throughput?&lt;/LI&gt;&lt;/OL&gt;</description>
      <pubDate>Mon, 14 Jun 2021 22:15:21 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24698#M17188</guid>
      <dc:creator>Srikanth_Gupta_</dc:creator>
      <dc:date>2021-06-14T22:15:21Z</dc:date>
    </item>
    <item>
      <title>Re: What are Best Practices for Spark streaming in Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24699#M17189</link>
      <description>&lt;P&gt;What are best practices for Spark streaming in Databricks?&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Is it a good idea to consume multiple topics in one streaming job? - Yes, it is fine; we can create a fair pool and provide the infrastructure to each stream so that the streams do not interfere with each other.&lt;/LI&gt;&lt;LI&gt;Is auto scaling recommended for Spark streaming? - No.&lt;/LI&gt;&lt;LI&gt;How many worker nodes should we choose for a streaming job? - One core per partition.&lt;/LI&gt;&lt;LI&gt;When should we run OPTIMIZE for continuously streaming topics? - Any time.&lt;/LI&gt;&lt;LI&gt;Are there any other things to consider when implementing streaming jobs with high throughput? - Compute VMs are preferred as nodes.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 18 Jun 2021 12:58:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24699#M17189</guid>
      <dc:creator>User16826994223</dc:creator>
      <dc:date>2021-06-18T12:58:22Z</dc:date>
    </item>
    <item>
      <title>Re: What are Best Practices for Spark streaming in Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24700#M17190</link>
      <description>&lt;P&gt;See our &lt;A href="https://docs.databricks.com/spark/latest/structured-streaming/production.html" alt="https://docs.databricks.com/spark/latest/structured-streaming/production.html" target="_blank"&gt;docs&lt;/A&gt; for other considerations when deploying a production streaming job.&lt;/P&gt;</description>
      <pubDate>Fri, 18 Jun 2021 17:37:30 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/what-are-best-practices-for-spark-streaming-in-databricks/m-p/24700#M17190</guid>
      <dc:creator>craig_ng</dc:creator>
      <dc:date>2021-06-18T17:37:30Z</dc:date>
    </item>
  </channel>
</rss>

