<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Performance issue while calling Sagemaker Endpoint in pyspark udf in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/performance-issue-while-calling-sagemaker-endpoint-in-pyspark/m-p/50113#M1669</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I have pyspark dataframe which calls pyspark udf which in turn calls sagemaker endpoint. But when dataframe has more rows, endpoint start failing. Also it takes longer to process.&lt;/P&gt;&lt;P&gt;Please suggest how to call sagemaker endpoint from pyspark.&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Sanjay&lt;/P&gt;</description>
    <pubDate>Mon, 30 Oct 2023 14:53:48 GMT</pubDate>
    <dc:creator>sanjay</dc:creator>
    <dc:date>2023-10-30T14:53:48Z</dc:date>
    <item>
      <title>Performance issue while calling Sagemaker Endpoint in pyspark udf</title>
      <link>https://community.databricks.com/t5/get-started-discussions/performance-issue-while-calling-sagemaker-endpoint-in-pyspark/m-p/50113#M1669</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I have pyspark dataframe which calls pyspark udf which in turn calls sagemaker endpoint. But when dataframe has more rows, endpoint start failing. Also it takes longer to process.&lt;/P&gt;&lt;P&gt;Please suggest how to call sagemaker endpoint from pyspark.&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Sanjay&lt;/P&gt;</description>
      <pubDate>Mon, 30 Oct 2023 14:53:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/performance-issue-while-calling-sagemaker-endpoint-in-pyspark/m-p/50113#M1669</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-10-30T14:53:48Z</dc:date>
    </item>
    <item>
      <title>Re: Performance issue while calling Sagemaker Endpoint in pyspark udf</title>
      <link>https://community.databricks.com/t5/get-started-discussions/performance-issue-while-calling-sagemaker-endpoint-in-pyspark/m-p/50172#M1674</link>
      <description>&lt;P&gt;Thank you&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;for prompt response.&amp;nbsp;&lt;/P&gt;&lt;P&gt;"send batch to sagemaker", you mean sending multiple data records in every sagemaker call? As sagemaker has 60 second timeout, will this not timeout the request if there are multiple records in single call&lt;/P&gt;</description>
      <pubDate>Tue, 31 Oct 2023 07:01:55 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/performance-issue-while-calling-sagemaker-endpoint-in-pyspark/m-p/50172#M1674</guid>
      <dc:creator>sanjay</dc:creator>
      <dc:date>2023-10-31T07:01:55Z</dc:date>
    </item>
  </channel>
</rss>

