<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Unable to connect mongo with Databricks in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65738#M32908</link>
    <description>&lt;P&gt;Yes, I verified. The path is correct.&lt;/P&gt;</description>
    <pubDate>Mon, 08 Apr 2024 04:37:02 GMT</pubDate>
    <dc:creator>InTimetec</dc:creator>
    <dc:date>2024-04-08T04:37:02Z</dc:date>
    <item>
      <title>Unable to connect mongo with Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65551#M32839</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I am trying to connect mongo with Databricks. I also used SSL certificate.&lt;/P&gt;&lt;P&gt;I created my own cluster and installed maven library&amp;nbsp;&lt;A target="_blank"&gt;org.mongodb.spark:mongo-spark-connector_2.12:3.0.1.&lt;/A&gt;&lt;/P&gt;&lt;P&gt;This is my code:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;connection_string =f"mongodb://{secret['user']}:{secret['password']}@{secret['host']}:{secret['port']}/?authSource={secret['database']}&amp;amp;tls=true&amp;amp;tlsCAFile=temp/CA-certificate.pem"

df = spark.read.format("com.mongodb.spark.sql.DefaultSource")\
    .option("database", database)\
    .option("collection", collection)\
    .option("spark.mongodb.input.uri", connectionString)\
    .option("ssl", "true")\
    .option("sslCertificate", sslCertificateFilePath)\
    .load()&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;When I run the above code, I get the error below:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="InTimetec_0-1712295715248.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/6926i6199903D9B3C8719/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="InTimetec_0-1712295715248.png" alt="InTimetec_0-1712295715248.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Please provide a solution for this.&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 05 Apr 2024 05:43:44 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65551#M32839</guid>
      <dc:creator>InTimetec</dc:creator>
      <dc:date>2024-04-05T05:43:44Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to connect mongo with Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65641#M32875</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/103252"&gt;@InTimetec&lt;/a&gt;&amp;nbsp;- can you please check/list if the sslCertificate is available in the sslCertificateFilePath mentioned above?&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 05 Apr 2024 17:47:54 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65641#M32875</guid>
      <dc:creator>shan_chandra</dc:creator>
      <dc:date>2024-04-05T17:47:54Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to connect mongo with Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65736#M32907</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/9"&gt;@Retired_mod&lt;/a&gt;&amp;nbsp;I updated my code as below:&lt;/P&gt;&lt;LI-CODE lang="markup"&gt; df = spark.read.format("com.mongodb.spark.sql.DefaultSource")\
        .option("database", database)\
        .option("collection", collection)\
        .option("spark.mongodb.input.uri", connectionString)\
        .option("tlsUseSystemCA","true")\
        .load()&lt;/LI-CODE&gt;&lt;P&gt;Now I am getting the error below:&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;Error: An error occurred while calling o516.load.
: com.mongodb.MongoTimeoutException: Timed out after 30000 ms while waiting to connect. Client view of cluster state is {type=UNKNOWN, servers=[{address=a-coe-aws-mongo-db.cluster-cubeteznsgeb.us-west-2.docdb.amazonaws.com:27017, type=UNKNOWN, state=CONNECTING}]
	at com.mongodb.internal.connection.BaseCluster.getDescription(BaseCluster.java:177)
	at com.mongodb.internal.connection.SingleServerCluster.getDescription(SingleServerCluster.java:41)
	at com.mongodb.client.internal.MongoClientDelegate.getConnectedClusterDescription(MongoClientDelegate.java:147)
	at com.mongodb.client.internal.MongoClientDelegate.createClientSession(MongoClientDelegate.java:98)
	at com.mongodb.client.internal.MongoClientDelegate$DelegateOperationExecutor.getClientSession(MongoClientDelegate.java:278)
	at com.mongodb.client.internal.MongoClientDelegate$DelegateOperationExecutor.execute(MongoClientDelegate.java:182)
	at com.mongodb.client.internal.MongoDatabaseImpl.executeCommand(MongoDatabaseImpl.java:194)
	at com.mongodb.client.internal.MongoDatabaseImpl.runCommand(MongoDatabaseImpl.java:163)
	at com.mongodb.client.internal.MongoDatabaseImpl.runCommand(MongoDatabaseImpl.java:158)
	at com.mongodb.spark.MongoConnector.$anonfun$hasSampleAggregateOperator$1(MongoConnector.scala:234)
	at com.mongodb.spark.MongoConnector.$anonfun$withDatabaseDo$1(MongoConnector.scala:171)
	at com.mongodb.spark.MongoConnector.withMongoClientDo(MongoConnector.scala:154)
	at com.mongodb.spark.MongoConnector.withDatabaseDo(MongoConnector.scala:171)
	at com.mongodb.spark.MongoConnector.hasSampleAggregateOperator(MongoConnector.scala:234)
	at com.mongodb.spark.rdd.MongoRDD.hasSampleAggregateOperator$lzycompute(MongoRDD.scala:221)
	at com.mongodb.spark.rdd.MongoRDD.hasSampleAggregateOperator(MongoRDD.scala:221)
	at com.mongodb.spark.sql.MongoInferSchema$.apply(MongoInferSchema.scala:68)
	at com.mongodb.spark.sql.DefaultSource.constructRelation(DefaultSource.scala:97)
	at com.mongodb.spark.sql.DefaultSource.createRelation(DefaultSource.scala:50)
	at org.apache.spark.sql.execution.datasources.DataSource.resolveRelation(DataSource.scala:390)
	at org.apache.spark.sql.DataFrameReader.loadV1Source(DataFrameReader.scala:378)
	at org.apache.spark.sql.DataFrameReader.$anonfun$load$2(DataFrameReader.scala:334)
	at scala.Option.getOrElse(Option.scala:189)
	at org.apache.spark.sql.DataFrameReader.load(DataFrameReader.scala:334)
	at org.apache.spark.sql.DataFrameReader.load(DataFrameReader.scala:226)
	at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
	at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
	at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
	at java.lang.reflect.Method.invoke(Method.java:498)
	at py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244)
	at py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:397)
	at py4j.Gateway.invoke(Gateway.java:306)
	at py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132)
	at py4j.commands.CallCommand.execute(CallCommand.java:79)
	at py4j.ClientServerConnection.waitForCommands(ClientServerConnection.java:199)
	at py4j.ClientServerConnection.run(ClientServerConnection.java:119)
	at java.lang.Thread.run(Thread.java:750)&lt;/LI-CODE&gt;&lt;P&gt;I also tried to increase the timeout. For this, I added the code below.&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;.option("spark.mongodb.input.connectionTimeoutMs", "120000")&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;But I am still getting the same error.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 08 Apr 2024 04:34:05 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65736#M32907</guid>
      <dc:creator>InTimetec</dc:creator>
      <dc:date>2024-04-08T04:34:05Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to connect mongo with Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65738#M32908</link>
      <description>&lt;P&gt;Yes, I verified. The path is correct.&lt;/P&gt;</description>
      <pubDate>Mon, 08 Apr 2024 04:37:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/65738#M32908</guid>
      <dc:creator>InTimetec</dc:creator>
      <dc:date>2024-04-08T04:37:02Z</dc:date>
    </item>
    <item>
      <title>Re: Unable to connect mongo with Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/66042#M32997</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/103252"&gt;@InTimetec&lt;/a&gt;&amp;nbsp; - could you please check if the port 27017 is accessible from the workspace VPC network? Also, please check with your internal network team for any connectivity issues.&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Per this documented observation -&amp;nbsp;&lt;A href="https://community.databricks.com/t5/data-engineering/mongodb-spark-connector-v10-x-read-error-on-databricks-13-x/m-p/45342#M27855" target="_blank"&gt;https://community.databricks.com/t5/data-engineering/mongodb-spark-connector-v10-x-read-error-on-databricks-13-x/m-p/45342#M27855&lt;/A&gt;,&amp;nbsp;you can use a DBR 13.3 LTS cluster for compatibility.&lt;/P&gt;</description>
      <pubDate>Wed, 10 Apr 2024 20:17:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/unable-to-connect-mongo-with-databricks/m-p/66042#M32997</guid>
      <dc:creator>shan_chandra</dc:creator>
      <dc:date>2024-04-10T20:17:48Z</dc:date>
    </item>
  </channel>
</rss>

