<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Are serverless endpoints possible in this Technical Blog post by qianyu? in Generative AI</title>
    <link>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117672#M862</link>
    <description>&lt;P&gt;Model serving is already serverless enabled.&amp;nbsp; You can even set a budget for this (public preview).&lt;BR /&gt;&lt;A href="https://docs.databricks.com/aws/en/machine-learning/model-serving/manage-serving-endpoints" target="_blank"&gt;https://docs.databricks.com/aws/en/machine-learning/model-serving/manage-serving-endpoints&lt;/A&gt;&lt;BR /&gt;&lt;A href="https://docs.databricks.com/aws/en/machine-learning/model-serving/foundation-model-overview" target="_blank"&gt;https://docs.databricks.com/aws/en/machine-learning/model-serving/foundation-model-overview&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;Or do you mean something else (like using a databricks serverless sql/eng instance)?&lt;/P&gt;</description>
    <pubDate>Mon, 05 May 2025 07:12:34 GMT</pubDate>
    <dc:creator>-werners-</dc:creator>
    <dc:date>2025-05-05T07:12:34Z</dc:date>
    <item>
      <title>Are serverless endpoints possible in this Technical Blog post by qianyu?</title>
      <link>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117615#M861</link>
      <description>&lt;P&gt;Hi, are serverless endpoints possible for Whisper and Llama in this Technical Blog post by&amp;nbsp;&lt;SPAN class=""&gt;qianyu&lt;/SPAN&gt;?&lt;/P&gt;&lt;P class=""&gt;&lt;A href="https://community.databricks.com/t5/technical-blog/streamline-customer-call-center-transcripts-analytics-with/ba-p/101689" target="_blank" rel="noopener"&gt;https://community.databricks.com/t5/technical-blog/streamline-customer-call-center-transcripts-analytics-with/ba-p/101689&lt;/A&gt;&lt;/P&gt;&lt;P class=""&gt;Thanks!&lt;/P&gt;&lt;P class=""&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 03 May 2025 17:35:54 GMT</pubDate>
      <guid>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117615#M861</guid>
      <dc:creator>brandt6264</dc:creator>
      <dc:date>2025-05-03T17:35:54Z</dc:date>
    </item>
    <item>
      <title>Re: Are serverless endpoints possible in this Technical Blog post by qianyu?</title>
      <link>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117672#M862</link>
      <description>&lt;P&gt;Model serving is already serverless enabled.&amp;nbsp; You can even set a budget for this (public preview).&lt;BR /&gt;&lt;A href="https://docs.databricks.com/aws/en/machine-learning/model-serving/manage-serving-endpoints" target="_blank"&gt;https://docs.databricks.com/aws/en/machine-learning/model-serving/manage-serving-endpoints&lt;/A&gt;&lt;BR /&gt;&lt;A href="https://docs.databricks.com/aws/en/machine-learning/model-serving/foundation-model-overview" target="_blank"&gt;https://docs.databricks.com/aws/en/machine-learning/model-serving/foundation-model-overview&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;Or do you mean something else (like using a databricks serverless sql/eng instance)?&lt;/P&gt;</description>
      <pubDate>Mon, 05 May 2025 07:12:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117672#M862</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2025-05-05T07:12:34Z</dc:date>
    </item>
    <item>
      <title>Re: Are serverless endpoints possible in this Technical Blog post by qianyu?</title>
      <link>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117728#M863</link>
      <description>&lt;P&gt;Thanks for the clarification and links.&lt;/P&gt;&lt;P&gt;Bottom line, what I am trying to avoid is spinning up AWS resources in the background that will incur ongoing charges until I track them down and terminate them (I am a new Databricks customer and still trying to navigate the billing/cost system). The "Serve this model" UI looked suspiciously like it was going to do this but on second look, maybe not.&lt;/P&gt;&lt;P&gt;I am just wanting to confirm my only costs, Databricks or AWS,&amp;nbsp;&lt;SPAN&gt;for Whisper and Llama in this Technical Blog post &lt;/SPAN&gt;will be only for the short duration they will be used. Thanks!&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 05 May 2025 15:24:43 GMT</pubDate>
      <guid>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117728#M863</guid>
      <dc:creator>brandt6264</dc:creator>
      <dc:date>2025-05-05T15:24:43Z</dc:date>
    </item>
    <item>
      <title>Re: Are serverless endpoints possible in this Technical Blog post by qianyu?</title>
      <link>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117816#M866</link>
      <description>&lt;P&gt;&lt;A href="https://www.databricks.com/product/pricing/foundation-model-serving" target="_blank"&gt;https://www.databricks.com/product/pricing/foundation-model-serving&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;We don´t serve models on databricks, but as far as i can see you pay per input/output tokens (for foundation models).&lt;BR /&gt;For classic models:&lt;BR /&gt;&lt;A href="https://www.databricks.com/product/pricing/model-serving" target="_blank"&gt;https://www.databricks.com/product/pricing/model-serving&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 06 May 2025 07:15:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/generative-ai/are-serverless-endpoints-possible-in-this-technical-blog-post-by/m-p/117816#M866</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2025-05-06T07:15:16Z</dc:date>
    </item>
  </channel>
</rss>

