<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Databricks + Snowflake Snowpipe Streaming in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4588#M1269</link>
    <description>&lt;P&gt;why do you need Snowpipe at all ? Connect to Kafka directly from Databricks : check &lt;A href="https://www.dbdemos.ai/demo.html?demoName=streaming-sessionization" alt="https://www.dbdemos.ai/demo.html?demoName=streaming-sessionization" target="_blank"&gt;https://www.dbdemos.ai/demo.html?demoName=streaming-sessionization&lt;/A&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 10 May 2023 13:35:25 GMT</pubDate>
    <dc:creator>artsheiko</dc:creator>
    <dc:date>2023-05-10T13:35:25Z</dc:date>
    <item>
      <title>Databricks + Snowflake Snowpipe Streaming</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4585#M1266</link>
      <description>&lt;P&gt;Does anyone know whether it is possible to use Databricks Snowflake Connector together with the latest Snowflake feature which is Snowpipe Streaming?&lt;/P&gt;</description>
      <pubDate>Wed, 10 May 2023 11:28:04 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4585#M1266</guid>
      <dc:creator>ptutak</dc:creator>
      <dc:date>2023-05-10T11:28:04Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks + Snowflake Snowpipe Streaming</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4586#M1267</link>
      <description>&lt;P&gt;At its core, &lt;A href="https://docs.snowflake.com/en/user-guide/data-load-snowpipe-intro.html" alt="https://docs.snowflake.com/en/user-guide/data-load-snowpipe-intro.html" target="_blank"&gt;&lt;U&gt;Snowpipe&lt;/U&gt;&lt;/A&gt; is a tool to copy data into Snowflake from cloud storage. Snowpipe is not about streaming, but about how to batch load data from cloud storage into a table on a recurring basis.&lt;/P&gt;&lt;P&gt;Databricks has a similar feature that we call &lt;A href="https://docs.databricks.com/ingestion/auto-loader/index.html" alt="https://docs.databricks.com/ingestion/auto-loader/index.html" target="_blank"&gt;Auto Loader&lt;/A&gt;. Auto loader enables developers to create a Spark Structured Streaming pipeline with cloud files as a data source.&lt;/P&gt;&lt;P&gt;Use &lt;A href="https://docs.databricks.com/structured-streaming/index.html" alt="https://docs.databricks.com/structured-streaming/index.html" target="_blank"&gt;Structured Streaming&lt;/A&gt; or &lt;A href="https://docs.databricks.com/delta-live-tables/index.html" alt="https://docs.databricks.com/delta-live-tables/index.html" target="_blank"&gt;Delta Live Tables&lt;/A&gt; to implement streaming use-cases.&lt;/P&gt;</description>
      <pubDate>Wed, 10 May 2023 13:17:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4586#M1267</guid>
      <dc:creator>artsheiko</dc:creator>
      <dc:date>2023-05-10T13:17:48Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks + Snowflake Snowpipe Streaming</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4587#M1268</link>
      <description>&lt;P&gt;The use case that we're trying to solve is loading data from Kafka into Snowflake using Databricks, we could use the Databricks Snowflake Connector but only if it's able to use &lt;A href="https://docs.snowflake.com/en/user-guide/data-load-snowpipe-streaming-overview" alt="https://docs.snowflake.com/en/user-guide/data-load-snowpipe-streaming-overview" target="_blank"&gt;Snowpipe Streaming&lt;/A&gt; underneath.&lt;/P&gt;</description>
      <pubDate>Wed, 10 May 2023 13:33:24 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4587#M1268</guid>
      <dc:creator>ptutak</dc:creator>
      <dc:date>2023-05-10T13:33:24Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks + Snowflake Snowpipe Streaming</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4588#M1269</link>
      <description>&lt;P&gt;why do you need Snowpipe at all ? Connect to Kafka directly from Databricks : check &lt;A href="https://www.dbdemos.ai/demo.html?demoName=streaming-sessionization" alt="https://www.dbdemos.ai/demo.html?demoName=streaming-sessionization" target="_blank"&gt;https://www.dbdemos.ai/demo.html?demoName=streaming-sessionization&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 10 May 2023 13:35:25 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4588#M1269</guid>
      <dc:creator>artsheiko</dc:creator>
      <dc:date>2023-05-10T13:35:25Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks + Snowflake Snowpipe Streaming</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4589#M1270</link>
      <description>&lt;P&gt;With typical Snowflake Connector we cannot omit the Snowflake Warehouse which adds to the cost of the whole operation, whereas when we're using Snowpipe Streaming we can omit the Warehouse and reduce the cost: &lt;A href="https://docs.snowflake.com/en/user-guide/data-load-snowpipe-streaming-billing" alt="https://docs.snowflake.com/en/user-guide/data-load-snowpipe-streaming-billing" target="_blank"&gt;snowpipe-streaming-cost&lt;/A&gt; .&lt;/P&gt;</description>
      <pubDate>Wed, 10 May 2023 15:22:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4589#M1270</guid>
      <dc:creator>ptutak</dc:creator>
      <dc:date>2023-05-10T15:22:07Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks + Snowflake Snowpipe Streaming</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4590#M1271</link>
      <description>&lt;P&gt;@Piotr Tutak​&amp;nbsp;, I believe you don't need Snowflake at all - just use source files / events from your Data Lake / message broker to process it within Databricks. Auto-loader that might be combined with DLT.&lt;/P&gt;&lt;P&gt;&lt;A href="https://www.youtube.com/watch?v=_yfApABaeBk" alt="https://www.youtube.com/watch?v=_yfApABaeBk" target="_blank"&gt;How to + demo&lt;/A&gt;.&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/ingestion/auto-loader/index.html" alt="https://docs.databricks.com/ingestion/auto-loader/index.html" target="_blank"&gt;Auto loader doc&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.databricks.com/delta-live-tables/index.html" alt="https://docs.databricks.com/delta-live-tables/index.html" target="_blank"&gt;DLT doc&lt;/A&gt;&lt;/P&gt;&lt;P&gt;With Auto loader you'll benefit also from the possibility to work in streaming mode and switch to batch if needed. DLT allows you to guarantee data quality. Obviously much more value added features might be listed here if we compare vs snowpipe. Among them you'll be able to estimate and control costs - something that is still not possible with snowpipe, unfortunately.&lt;/P&gt;</description>
      <pubDate>Fri, 09 Jun 2023 20:19:00 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-snowflake-snowpipe-streaming/m-p/4590#M1271</guid>
      <dc:creator>artsheiko</dc:creator>
      <dc:date>2023-06-09T20:19:00Z</dc:date>
    </item>
  </channel>
</rss>

