<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Provisioned concurrency of serving endpoints scales to zero in Machine Learning</title>
    <link>https://community.databricks.com/t5/machine-learning/provisioned-concurrency-of-serving-endpoints-scales-to-zero/m-p/38904#M2015</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class=""&gt;We provisioned the endpoint with 4 DBUs and also disabled the scale_to_zero option. For some reason, it randomly drops to 0 provisioned concurrency. Logs available in the serving endpoint service are not insightful.&lt;/DIV&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class=""&gt;Currently, we are provisioning the endpoint with 8 DBUs but still, it randomly drops 4. What might be the issue?&lt;/DIV&gt;&lt;DIV class=""&gt;&lt;BR /&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="chidifrank_0-1690968368091.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/3036i5127AF6467C6095E/image-size/medium?v=v2&amp;amp;px=400" role="button" title="chidifrank_0-1690968368091.png" alt="chidifrank_0-1690968368091.png" /&gt;&lt;/span&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;</description>
    <pubDate>Wed, 02 Aug 2023 09:28:17 GMT</pubDate>
    <dc:creator>chidifrank</dc:creator>
    <dc:date>2023-08-02T09:28:17Z</dc:date>
    <item>
      <title>Provisioned concurrency of serving endpoints scales to zero</title>
      <link>https://community.databricks.com/t5/machine-learning/provisioned-concurrency-of-serving-endpoints-scales-to-zero/m-p/38904#M2015</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class=""&gt;We provisioned the endpoint with 4 DBUs and also disabled the scale_to_zero option. For some reason, it randomly drops to 0 provisioned concurrency. Logs available in the serving endpoint service are not insightful.&lt;/DIV&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class=""&gt;Currently, we are provisioning the endpoint with 8 DBUs but still, it randomly drops 4. What might be the issue?&lt;/DIV&gt;&lt;DIV class=""&gt;&lt;BR /&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="chidifrank_0-1690968368091.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/3036i5127AF6467C6095E/image-size/medium?v=v2&amp;amp;px=400" role="button" title="chidifrank_0-1690968368091.png" alt="chidifrank_0-1690968368091.png" /&gt;&lt;/span&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;DIV class=""&gt;&amp;nbsp;&lt;/DIV&gt;</description>
      <pubDate>Wed, 02 Aug 2023 09:28:17 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/provisioned-concurrency-of-serving-endpoints-scales-to-zero/m-p/38904#M2015</guid>
      <dc:creator>chidifrank</dc:creator>
      <dc:date>2023-08-02T09:28:17Z</dc:date>
    </item>
    <item>
      <title>Re: Provisioned concurrency of serving endpoints scales to zero</title>
      <link>https://community.databricks.com/t5/machine-learning/provisioned-concurrency-of-serving-endpoints-scales-to-zero/m-p/39019#M2021</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;I apologize if my question wasn't clear; let me clarify it.&lt;BR /&gt;We are &lt;STRONG&gt;not&lt;/STRONG&gt; using the &lt;STRONG&gt;scale_to_zero&lt;/STRONG&gt; option and we are &lt;STRONG&gt;not&lt;/STRONG&gt; doing any warmup requests so it should never scale to zero despite traffic or zero traffic right?&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="chidifrank_0-1691048861787.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/3048i027C7515CBEEBFE3/image-size/medium?v=v2&amp;amp;px=400" role="button" title="chidifrank_0-1691048861787.png" alt="chidifrank_0-1691048861787.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 03 Aug 2023 11:45:32 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/provisioned-concurrency-of-serving-endpoints-scales-to-zero/m-p/39019#M2021</guid>
      <dc:creator>chidifrank</dc:creator>
      <dc:date>2023-08-03T11:45:32Z</dc:date>
    </item>
  </channel>
</rss>

