<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Unable to stream from google pub/sub in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/109524#M43339</link>
    <description>&lt;P&gt;I see some issues when using Pub/Sub as a source.&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;In writeStream, neither .foreach nor .foreachBatch is called when stream data arrives.&lt;/P&gt;</description>
    <pubDate>Sun, 09 Feb 2025 08:12:13 GMT</pubDate>
    <dc:creator>davidkhala-ms</dc:creator>
    <dc:date>2025-02-09T08:12:13Z</dc:date>
    <item>
      <title>Unable to stream from google pub/sub</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/20220#M13627</link>
      <description>&lt;P&gt;I am trying to run the code below to subscribe to a Pub/Sub subscription, but it throws this exception:&lt;/P&gt;&lt;P&gt;java.lang.NoClassDefFoundError: org/apache/spark/sql/sources/v2/DataSourceV2&lt;/P&gt;&lt;P&gt;I have tried all versions of &lt;A href="https://mvnrepository.com/artifact/com.google.cloud/pubsublite-spark-sql-streaming" target="test_blank"&gt;https://mvnrepository.com/artifact/com.google.cloud/pubsublite-spark-sql-streaming&lt;/A&gt;, with no luck so far.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;from pyspark.sql import SparkSession&lt;/P&gt;&lt;P&gt;spark = SparkSession.builder.appName('Simple Pub/Sub Lite Read').getOrCreate()&lt;/P&gt;&lt;P&gt;df = spark.readStream \&lt;/P&gt;&lt;P&gt;&amp;nbsp;.format("pubsublite") \&lt;/P&gt;&lt;P&gt;&amp;nbsp;.option("pubsublite.subscription", "My subscription path") \&lt;/P&gt;&lt;P&gt;&amp;nbsp;.option("gcp.credentials.key", "my gcp credential").load()&lt;/P&gt;&lt;P&gt;df.show(10, False)&lt;/P&gt;</description>
      <pubDate>Wed, 18 May 2022 22:24:56 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/20220#M13627</guid>
      <dc:creator>210573</dc:creator>
      <dc:date>2022-05-18T22:24:56Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to stream from google pub/sub</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/20221#M13628</link>
      <description>&lt;P&gt;Can you retry without creating a SparkSession? Databricks provides one for you.&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2022 07:23:05 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/20221#M13628</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2022-05-19T07:23:05Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to stream from google pub/sub</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/20222#M13629</link>
      <description>&lt;P&gt;Hi @cloud user​&amp;nbsp;As of now, we do not have structured streaming support with Pub/Sub. Below are the supported sources with structured streaming:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.gcp.databricks.com/spark/latest/structured-streaming/data-sources.html" target="test_blank"&gt;https://docs.gcp.databricks.com/spark/latest/structured-streaming/data-sources.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 02 Jun 2022 03:37:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/20222#M13629</guid>
      <dc:creator>Noopur_Nigam</dc:creator>
      <dc:date>2022-06-02T03:37:49Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to stream from google pub/sub</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/40368#M27190</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/57791"&gt;@210573&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Databricks now supports Pub/Sub streaming natively, so you can start using it for your use case. For more information, see the official documentation below:&lt;/P&gt;&lt;P&gt;&lt;A title="PUB/SUB with Databricks" href="https://docs.databricks.com/en/structured-streaming/pub-sub.html" target="_blank" rel="noopener"&gt;PUB/SUB with Databricks&lt;/A&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 18 Aug 2023 05:02:53 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/40368#M27190</guid>
      <dc:creator>Ajay-Pandey</dc:creator>
      <dc:date>2023-08-18T05:02:53Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to stream from google pub/sub</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/109524#M43339</link>
      <description>&lt;P&gt;I see some issues when using Pub/Sub as a source.&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;In writeStream, neither .foreach nor .foreachBatch is called when stream data arrives.&lt;/P&gt;</description>
      <pubDate>Sun, 09 Feb 2025 08:12:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-stream-from-google-pub-sub/m-p/109524#M43339</guid>
      <dc:creator>davidkhala-ms</dc:creator>
      <dc:date>2025-02-09T08:12:13Z</dc:date>
    </item>
  </channel>
</rss>

