<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic DataBricks Foundational model rate limiting approach in Generative AI</title>
    <link>https://community.databricks.com/t5/generative-ai/databricks-foundational-model-rate-limiting-approach/m-p/98562#M639</link>
    <description>&lt;P&gt;Hi there,&lt;/P&gt;&lt;P&gt;Is this the correct approach to comply with the rate limit restrictions in the foundational model API?&lt;/P&gt;&lt;LI-CODE lang="python"&gt;from langchain_core.rate_limiters import InMemoryRateLimiter

rate_limiter = InMemoryRateLimiter(
    requests_per_second=2.0, 
    check_every_n_seconds=0.5, 
    max_bucket_size=10
)

chat_model = ChatDatabricks(
            endpoint=model,
            temperature=temperature,
            max_tokens=max_tokens,
            rate_limiter=rate_limiter
        )&lt;/LI-CODE&gt;</description>
    <pubDate>Tue, 12 Nov 2024 15:51:27 GMT</pubDate>
    <dc:creator>llmnerd</dc:creator>
    <dc:date>2024-11-12T15:51:27Z</dc:date>
    <item>
      <title>DataBricks Foundational model rate limiting approach</title>
      <link>https://community.databricks.com/t5/generative-ai/databricks-foundational-model-rate-limiting-approach/m-p/98562#M639</link>
      <description>&lt;P&gt;Hi there,&lt;/P&gt;&lt;P&gt;Is this the correct approach to comply with the rate limit restrictions in the foundational model API?&lt;/P&gt;&lt;LI-CODE lang="python"&gt;from langchain_core.rate_limiters import InMemoryRateLimiter

rate_limiter = InMemoryRateLimiter(
    requests_per_second=2.0, 
    check_every_n_seconds=0.5, 
    max_bucket_size=10
)

chat_model = ChatDatabricks(
            endpoint=model,
            temperature=temperature,
            max_tokens=max_tokens,
            rate_limiter=rate_limiter
        )&lt;/LI-CODE&gt;</description>
      <pubDate>Tue, 12 Nov 2024 15:51:27 GMT</pubDate>
      <guid>https://community.databricks.com/t5/generative-ai/databricks-foundational-model-rate-limiting-approach/m-p/98562#M639</guid>
      <dc:creator>llmnerd</dc:creator>
      <dc:date>2024-11-12T15:51:27Z</dc:date>
    </item>
    <item>
      <title>Re: DataBricks Foundational model rate limiting approach</title>
      <link>https://community.databricks.com/t5/generative-ai/databricks-foundational-model-rate-limiting-approach/m-p/98588#M641</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/132004"&gt;@llmnerd&lt;/a&gt;,&lt;/P&gt;
&lt;P&gt;Yes, the approach you have outlined to fulfill the rate limit restrictions in the foundational model API using &lt;CODE&gt;InMemoryRateLimiter&lt;/CODE&gt; from &lt;CODE&gt;langchain_core&lt;/CODE&gt; appears to be correct. This setup should help you manage the rate limits effectively for your foundational model API. If you have any specific requirements or encounter any issues, please let us know.&lt;/P&gt;</description>
      <pubDate>Tue, 12 Nov 2024 22:00:56 GMT</pubDate>
      <guid>https://community.databricks.com/t5/generative-ai/databricks-foundational-model-rate-limiting-approach/m-p/98588#M641</guid>
      <dc:creator>Alberto_Umana</dc:creator>
      <dc:date>2024-11-12T22:00:56Z</dc:date>
    </item>
  </channel>
</rss>

