<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Databricks cluster starts with docker in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13531#M8204</link>
    <description>&lt;P&gt;Hi @Ignacio Guillamondegui​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope all is well! Just wanted to check in if you were able to resolve your issue and would you be happy to share the solution or mark an answer as best? Else please let us know if you need more help.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
    <pubDate>Sun, 04 Sep 2022 07:04:32 GMT</pubDate>
    <dc:creator>Vidula</dc:creator>
    <dc:date>2022-09-04T07:04:32Z</dc:date>
    <item>
      <title>Databricks cluster starts with docker</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13527#M8200</link>
      <description>&lt;P&gt;Hi there!&lt;/P&gt;&lt;P&gt;I hope you are doing well.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I'm trying to start a cluster with a Docker image to install all the libraries that I have to use.&lt;/P&gt;&lt;P&gt;I have the following Dockerfile, which installs only Python libraries, as you can see:&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;FROM databricksruntime/standard
WORKDIR /app
COPY . .
RUN apt-get update &amp;amp;&amp;amp; apt-get install -y python3-pip
RUN sudo apt-get install -y libpq-dev
RUN pip install -r /app/requirements.txt
CMD ["python3"]&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Does anybody know how to install Maven libraries from this same Dockerfile? I've tried and looked up many solutions, but I can't figure out how to do that.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The last thing I tried was a multi-stage build using the Maven image, but I had trouble with the dependencies (&lt;B&gt;missing POM.xml file&lt;/B&gt;).&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;# MAVEN + PYTHON
&amp;nbsp;
FROM databricksruntime/standard
WORKDIR /app
COPY . .
RUN apt-get update &amp;amp;&amp;amp; apt-get install -y python3-pip
RUN sudo apt-get install -y libpq-dev
RUN pip install -r /app/requirements.txt
CMD ["python3"]
&amp;nbsp;
FROM maven:latest
WORKDIR /root
COPY --from=0 /app .
&amp;nbsp;
RUN mvn clean install org.apache.maven.plugins:maven-dependency-plugin:2.1:get \
    -DrepoUrl=https://mvnrepository.com/artifact/com.crealytics/spark-excel_2.12/0.14.0 \
    -Dartifact=com.crealytics:spark-excel_2.12:0.14.0
&amp;nbsp;
RUN mvn clean install org.apache.maven.plugins:maven-dependency-plugin:2.1:get \
    -DrepoUrl=https://mvnrepository.com/artifact/mysql/mysql-connector-java \
    -Dartifact=mysql:mysql-connector-java:8.0.29&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image.png"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1691i8599DDFCBC6868E8/image-size/large?v=v2&amp;amp;px=999" role="button" title="image.png" alt="image.png" /&gt;&lt;/span&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I don't understand how to install Maven libraries from a Dockerfile.&lt;/P&gt;&lt;P&gt;If someone knows about something like this and could help me, I would appreciate it a lot.&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
      <pubDate>Thu, 14 Jul 2022 14:09:25 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13527#M8200</guid>
      <dc:creator>nachog99</dc:creator>
      <dc:date>2022-07-14T14:09:25Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks cluster starts with docker</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13529#M8202</link>
      <description>&lt;P&gt;Thanks! I have tried some answers from the S.O discussion and I could build the image, but I can't run it.&lt;/P&gt;&lt;P&gt;I can build the image using the flag &lt;I&gt;dependency:solve&lt;/I&gt;&lt;/P&gt;&lt;P&gt;But I still can't install it: when I run it, I receive the following message, so the cluster can't start.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1701iBB6841F2BFA13A48/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;Anyway, I'm grateful for your answer because it was very useful for learning how to resolve this issue. I appreciate that.&lt;/P&gt;</description>
      <pubDate>Fri, 15 Jul 2022 20:57:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13529#M8202</guid>
      <dc:creator>nachog99</dc:creator>
      <dc:date>2022-07-15T20:57:23Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks cluster starts with docker</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13530#M8203</link>
      <description>&lt;P&gt;1) Install your jars in a new layer, not in the same layer.&lt;/P&gt;&lt;P&gt;2) Installing with Maven is more work than building the library in your jar layer.&lt;/P&gt;</description>
      <pubDate>Sun, 17 Jul 2022 15:34:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13530#M8203</guid>
      <dc:creator>axb0</dc:creator>
      <dc:date>2022-07-17T15:34:07Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks cluster starts with docker</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13531#M8204</link>
      <description>&lt;P&gt;Hi @Ignacio Guillamondegui​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope all is well! Just wanted to check in if you were able to resolve your issue and would you be happy to share the solution or mark an answer as best? Else please let us know if you need more help.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 04 Sep 2022 07:04:32 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13531#M8204</guid>
      <dc:creator>Vidula</dc:creator>
      <dc:date>2022-09-04T07:04:32Z</dc:date>
    </item>
    <item>
      <title>Re: Databricks cluster starts with docker</title>
      <link>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13532#M8205</link>
      <description>&lt;P&gt;Hi! I am facing a similar issue.&lt;/P&gt;&lt;P&gt;I tried to use this one&lt;/P&gt;&lt;PRE&gt;&lt;CODE&gt;FROM databricksruntime/standard:10.4-LTS
&amp;nbsp;
ENV DEBIAN_FRONTEND=noninteractive
RUN apt update &amp;amp;&amp;amp; apt install -y maven &amp;amp;&amp;amp; rm -rf /var/lib/apt/lists/*
&amp;nbsp;
RUN /databricks/python3/bin/pip install databricks-cli
&amp;nbsp;
RUN mkdir /databricks/jars
&amp;nbsp;
RUN mvn org.apache.maven.plugins:maven-dependency-plugin:2.8:get -Dartifact=com.microsoft.azure.kusto:kusto-spark_3.0_2.12:2.5.2 -Ddest=/databricks/jars/
&amp;nbsp;
RUN /databricks/python3/bin/pip install azure-kusto-data==2.1.1&lt;/CODE&gt;&lt;/PRE&gt;&lt;P&gt;But it looks like it doesn't work. I get an error &lt;B&gt;java.lang.NoClassDefFoundError: com/microsoft/azure/kusto/data/exceptions/DataServiceException&lt;/B&gt;&lt;/P&gt;&lt;P&gt;And if I install libraries using an interface like on the picture - everything works.&lt;span class="lia-inline-image-display-wrapper" image-alt="Screenshot 2023-03-30 at 10.49.33"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1694i117D8C22DA7C5499/image-size/large?v=v2&amp;amp;px=999" role="button" title="Screenshot 2023-03-30 at 10.49.33" alt="Screenshot 2023-03-30 at 10.49.33" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 30 Mar 2023 08:50:51 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/databricks-cluster-starts-with-docker/m-p/13532#M8205</guid>
      <dc:creator>xneg</dc:creator>
      <dc:date>2023-03-30T08:50:51Z</dc:date>
    </item>
  </channel>
</rss>

