<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Instance Pool Usage in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106852#M42613</link>
    <description>&lt;P&gt;Unfortunately as of now the API endpoint will be the best approach.&lt;/P&gt;</description>
    <pubDate>Thu, 23 Jan 2025 19:40:51 GMT</pubDate>
    <dc:creator>Walter_C</dc:creator>
    <dc:date>2025-01-23T19:40:51Z</dc:date>
    <item>
      <title>Instance Pool Usage</title>
      <link>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106827#M42606</link>
      <description>&lt;P&gt;We have instance pools set up with a maximum capacity and are looking at ways to monitor the usage to help with our capacity planning.&lt;/P&gt;&lt;P&gt;I have been using the system tables to track how many nodes are being used within a pool at a point in time but it appears that the node_timeline table only tracks nodes as they are used and so idle nodes are not counted.&lt;/P&gt;&lt;P&gt;From the docs, idle nodes count towards the max capacity of the pool (along with nodes in use) so I cannot see how to capture this from the system tables. Is there any way of doing this?&lt;/P&gt;&lt;P&gt;I realise there is an API that I could hit to get the status of the pool periodically but was hoping there was a query option first.&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 23 Jan 2025 16:36:06 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106827#M42606</guid>
      <dc:creator>muir</dc:creator>
      <dc:date>2025-01-23T16:36:06Z</dc:date>
    </item>
    <item>
      <title>Re: Instance Pool Usage</title>
      <link>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106852#M42613</link>
      <description>&lt;P&gt;Unfortunately as of now the API endpoint will be the best approach.&lt;/P&gt;</description>
      <pubDate>Thu, 23 Jan 2025 19:40:51 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106852#M42613</guid>
      <dc:creator>Walter_C</dc:creator>
      <dc:date>2025-01-23T19:40:51Z</dc:date>
    </item>
    <item>
      <title>Re: Instance Pool Usage</title>
      <link>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106872#M42620</link>
      <description>&lt;P&gt;System tables like node_timeline only track active node usage, not idle nodes. Since idle nodes also count toward the pool's maximum capacity, their status cannot be directly captured through queries on system tables. To monitor both active and idle nodes within a pool, you’ll need to use the API to periodically fetch the pool status, as it provides comprehensive details, including idle nodes. Unfortunately, there isn’t a direct query-based solution to achieve this.&lt;/P&gt;</description>
      <pubDate>Fri, 24 Jan 2025 05:57:35 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/106872#M42620</guid>
      <dc:creator>nick533</dc:creator>
      <dc:date>2025-01-24T05:57:35Z</dc:date>
    </item>
    <item>
      <title>Re: Instance Pool Usage</title>
      <link>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/108879#M43167</link>
      <description>&lt;P&gt;I am also using it and it's working properly.&lt;/P&gt;</description>
      <pubDate>Wed, 05 Feb 2025 05:17:10 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/instance-pool-usage/m-p/108879#M43167</guid>
      <dc:creator>TuckerGage</dc:creator>
      <dc:date>2025-02-05T05:17:10Z</dc:date>
    </item>
  </channel>
</rss>

