<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic spark cluster monitoring and visibility in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17578#M11565</link>
    <description>&lt;P&gt;Hey. I'm working on a project where I'd like to be able to view and play around with the spark cluster metrics. I'd like to know what the utilization % and max values are for metrics like CPU, memory and network.&amp;nbsp;I've tried using some open source solutions (https://github.com/mspnp/spark-monitoring) but I'm not really getting what I'm looking for. Ideally, a solution that could give me insights on my Azure Databricks instances to optimize usage would be perfect. Currently, I can access some of these metrics on the metrics tab on my spark cluster page as static images but it'd be great if I could export that information to make my own insights or graphs.&lt;/P&gt;</description>
    <pubDate>Thu, 16 Jun 2022 07:33:18 GMT</pubDate>
    <dc:creator>Saurav</dc:creator>
    <dc:date>2022-06-16T07:33:18Z</dc:date>
    <item>
      <title>spark cluster monitoring and visibility</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17578#M11565</link>
      <description>&lt;P&gt;Hey. I'm working on a project where I'd like to be able to view and play around with the spark cluster metrics. I'd like to know what the utilization % and max values are for metrics like CPU, memory and network.&amp;nbsp;I've tried using some open source solutions (https://github.com/mspnp/spark-monitoring) but I'm not really getting what I'm looking for. Ideally, a solution that could give me insights on my Azure Databricks instances to optimize usage would be perfect. Currently, I can access some of these metrics on the metrics tab on my spark cluster page as static images but it'd be great if I could export that information to make my own insights or graphs.&lt;/P&gt;</description>
      <pubDate>Thu, 16 Jun 2022 07:33:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17578#M11565</guid>
      <dc:creator>Saurav</dc:creator>
      <dc:date>2022-06-16T07:33:18Z</dc:date>
    </item>
    <item>
      <title>Re: spark cluster monitoring and visibility</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17579#M11566</link>
      <description>&lt;P&gt;Hello @Saurav Santhosh​&amp;nbsp;&lt;/P&gt;&lt;P&gt;There are a few options for this&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;If you would like to see VM usage you can send these metrics to the Azure Log Analytics workspace &lt;/P&gt;&lt;P&gt;&lt;A href="https://github.com/Azure/AzureDatabricksBestPractices/blob/master/toc.md#Appendix-A" target="test_blank"&gt;https://github.com/Azure/AzureDatabricksBestPractices/blob/master/toc.md#Appendix-A&lt;/A&gt; &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Databricks solution&lt;/P&gt;&lt;P&gt;&lt;A href="https://databrickslabs.github.io/overwatch/" target="test_blank"&gt;https://databrickslabs.github.io/overwatch/&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Datadog&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.datadoghq.com/blog/databricks-monitoring-datadog/" target="test_blank"&gt;https://www.datadoghq.com/blog/databricks-monitoring-datadog/&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://databricks.com/blog/2017/06/01/apache-spark-cluster-monitoring-with-databricks-and-datadog.html" target="test_blank"&gt;https://databricks.com/blog/2017/06/01/apache-spark-cluster-monitoring-with-databricks-and-datadog.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 16 Jun 2022 10:09:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17579#M11566</guid>
      <dc:creator>User16764241763</dc:creator>
      <dc:date>2022-06-16T10:09:13Z</dc:date>
    </item>
    <item>
      <title>Re: spark cluster monitoring and visibility</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17580#M11567</link>
      <description>&lt;P&gt;Prometheus was added in spark 3.0 &lt;/P&gt;&lt;P&gt;&lt;A href="https://databricks.com/session_na20/native-support-of-prometheus-monitoring-in-apache-spark-3-0" target="test_blank"&gt;https://databricks.com/session_na20/native-support-of-prometheus-monitoring-in-apache-spark-3-0&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 16 Jun 2022 11:42:20 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17580#M11567</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-06-16T11:42:20Z</dc:date>
    </item>
    <item>
      <title>Re: spark cluster monitoring and visibility</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17582#M11569</link>
      <description>&lt;P&gt;Hey @Kaniz Fatma​, I appreciate the suggestions and will be looking into them. Haven't gotten to it yet so I didn't want to mention whether they worked for me or not. Since I'm looking to avoid solutions like DataDog, I'll be checking out the Prometheus and @Arvind Ravish​'s first suggestion. Thanks!&lt;/P&gt;</description>
      <pubDate>Wed, 22 Jun 2022 09:38:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17582#M11569</guid>
      <dc:creator>Saurav</dc:creator>
      <dc:date>2022-06-22T09:38:03Z</dc:date>
    </item>
    <item>
      <title>Re: spark cluster monitoring and visibility</title>
      <link>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17584#M11571</link>
      <description>&lt;P&gt;Just a friendly follow-up. Did you have time to check? Do you still need help, or can you mark the response that helped you as best?&lt;/P&gt;</description>
      <pubDate>Fri, 29 Jul 2022 20:07:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/spark-cluster-monitoring-and-visibility/m-p/17584#M11571</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2022-07-29T20:07:48Z</dc:date>
    </item>
  </channel>
</rss>

