<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How to get databricks performance metrics programmatically? in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65377#M8742</link>
    <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/103069"&gt;@Nandhini_Kumar&lt;/a&gt;, there are many performance metrics available - it depends on what you're looking to do with this data, and how you look to take action in real time. I would strongly recommend mapping out a user journey so you get only the metrics you need, and don't waste time trying to get these all hourly when they won't be used.&amp;nbsp;&lt;/P&gt;
&lt;UL&gt;
&lt;LI&gt;Cluster metrics - you can export these with cluster logging. It's worth noting that Ganglia is deprecated for newer runtimes&lt;/LI&gt;
&lt;LI&gt;Warehouse metrics - available through the API for query metrics&lt;/LI&gt;
&lt;LI&gt;System tables - if you're using Unity Catalog, these will update hourly&lt;/LI&gt;
&lt;LI&gt;Jobs performance - you can use the Jobs API&amp;nbsp;&lt;/LI&gt;
&lt;/UL&gt;
&lt;P&gt;API docs can be found here:&amp;nbsp;&lt;A href="https://docs.databricks.com/api/workspace/introduction" target="_blank"&gt;https://docs.databricks.com/api/workspace/introduction&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;System tables:&amp;nbsp;&lt;A href="https://docs.databricks.com/en/administration-guide/system-tables/index.html" target="_blank"&gt;https://docs.databricks.com/en/administration-guide/system-tables/index.html&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;BR /&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Wed, 03 Apr 2024 09:02:53 GMT</pubDate>
    <dc:creator>holly</dc:creator>
    <dc:date>2024-04-03T09:02:53Z</dc:date>
    <item>
      <title>How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65259#M8738</link>
      <description>&lt;P&gt;&lt;SPAN&gt;How to retrieve all Databricks performance metrics on an hourly basis. Is there a recommended method or API available for retrieving performance metrics ?&lt;BR /&gt;&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 02 Apr 2024 04:52:38 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65259#M8738</guid>
      <dc:creator>Nandhini_Kumar</dc:creator>
      <dc:date>2024-04-02T04:52:38Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65307#M8740</link>
      <description>&lt;P&gt;Thanks&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;for your response.&lt;BR /&gt;&lt;SPAN&gt;Could you please provide guidance on how we can achieve step 3 in AWS services?&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 02 Apr 2024 12:38:39 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65307#M8740</guid>
      <dc:creator>Nandhini_Kumar</dc:creator>
      <dc:date>2024-04-02T12:38:39Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65354#M8741</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;I encountered the "Error: getaddrinfo ENOTFOUND http" while attempting to run the API. &lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Could you please provide guidance on resolving this issue? Are there any prerequisites that need to be followed before running the API? I'd appreciate any assistance you can offer.&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 03 Apr 2024 02:31:33 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65354#M8741</guid>
      <dc:creator>Nandhini_Kumar</dc:creator>
      <dc:date>2024-04-03T02:31:33Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65377#M8742</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/103069"&gt;@Nandhini_Kumar&lt;/a&gt;, there are many performance metrics available - it depends on what you're looking to do with this data, and how you look to take action in real time. I would strongly recommend mapping out a user journey so you get only the metrics you need, and don't waste time trying to get these all hourly when they won't be used.&amp;nbsp;&lt;/P&gt;
&lt;UL&gt;
&lt;LI&gt;Cluster metrics - you can export these with cluster logging. It's worth noting that Ganglia is deprecated for newer runtimes&lt;/LI&gt;
&lt;LI&gt;Warehouse metrics - available through the API for query metrics&lt;/LI&gt;
&lt;LI&gt;System tables - if you're using Unity Catalog, these will update hourly&lt;/LI&gt;
&lt;LI&gt;Jobs performance - you can use the Jobs API&amp;nbsp;&lt;/LI&gt;
&lt;/UL&gt;
&lt;P&gt;API docs can be found here:&amp;nbsp;&lt;A href="https://docs.databricks.com/api/workspace/introduction" target="_blank"&gt;https://docs.databricks.com/api/workspace/introduction&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;System tables:&amp;nbsp;&lt;A href="https://docs.databricks.com/en/administration-guide/system-tables/index.html" target="_blank"&gt;https://docs.databricks.com/en/administration-guide/system-tables/index.html&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;BR /&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 03 Apr 2024 09:02:53 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/65377#M8742</guid>
      <dc:creator>holly</dc:creator>
      <dc:date>2024-04-03T09:02:53Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/97968#M8743</link>
      <description>&lt;P&gt;Any response here? Are there any APIs that expose this, especially the job performance metrics?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 06 Nov 2024 13:51:19 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/97968#M8743</guid>
      <dc:creator>rahuja</dc:creator>
      <dc:date>2024-11-06T13:51:19Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/99130#M8744</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/104464"&gt;@rahuja&lt;/a&gt;&amp;nbsp; can you be more specific on 'job performance'? Do you mean the spark metrics? Whether it was successful? How much it cost?&lt;/P&gt;</description>
      <pubDate>Mon, 18 Nov 2024 10:59:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/99130#M8744</guid>
      <dc:creator>holly</dc:creator>
      <dc:date>2024-11-18T10:59:22Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/99170#M8745</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/36301"&gt;@holly&lt;/a&gt;&amp;nbsp; yes, we need Spark metrics, e.g. the amount of compute used, the amount of memory used, etc.&lt;/P&gt;</description>
      <pubDate>Mon, 18 Nov 2024 12:34:28 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/99170#M8745</guid>
      <dc:creator>rahuja</dc:creator>
      <dc:date>2024-11-18T12:34:28Z</dc:date>
    </item>
    <item>
      <title>Re: How to get databricks performance metrics programmatically?</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/99630#M8746</link>
      <description>&lt;P&gt;The spark logs are available through &lt;A href="https://docs.databricks.com/en/compute/configure.html#compute-log-delivery" target="_blank" rel="noopener"&gt;cluster logging.&lt;/A&gt;&amp;nbsp;This is enabled at the cluster level for you to choose the destination for the logs.&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Just a heads up - interpreting them at scale is not trivial. I'd recommend having a read through the &lt;A href="https://databrickslabs.github.io/overwatch/dataengineer/modules/#sparkevents" target="_blank" rel="noopener"&gt;overwatch&lt;/A&gt; project to see how they're aggregated together.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 21 Nov 2024 14:19:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-get-databricks-performance-metrics-programmatically/m-p/99630#M8746</guid>
      <dc:creator>holly</dc:creator>
      <dc:date>2024-11-21T14:19:46Z</dc:date>
    </item>
  </channel>
</rss>

