<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Using Libreoffice in Databricks in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/using-libreoffice-in-databricks/m-p/38556#M26674</link>
    <description>&lt;P&gt;I suppose by Libreoffice you mean the sdk, without the frontend?&lt;/P&gt;&lt;P&gt;You will have to install the jar as a library on the compute cluster.&lt;BR /&gt;From that moment on, you can use the classes in your code.&lt;BR /&gt;If you cannot run the jar from a command line, it might be because it is not an executable.&lt;/P&gt;&lt;P&gt;Besides that: Databricks might not be the correct tool for such a scenario.&lt;/P&gt;</description>
    <pubDate>Thu, 27 Jul 2023 09:59:51 GMT</pubDate>
    <dc:creator>-werners-</dc:creator>
    <dc:date>2023-07-27T09:59:51Z</dc:date>
    <item>
      <title>Using Libreoffice in Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/using-libreoffice-in-databricks/m-p/38544#M26668</link>
      <description>&lt;P&gt;Hi Community,&amp;nbsp;&lt;/P&gt;&lt;P&gt;I'm using Databricks E2, and need to convert pptx files to pdf files.&lt;/P&gt;&lt;P&gt;This can be done in either a python or an R notebook using #Libreoffice&lt;/P&gt;&lt;P&gt;To achieve this I'd have to download LibreOffice; I'm not too sure how to do that. Would I have to download it on the cluster I'm using? If so, I tried uploading the LibreOffice jar file from the compute tab, and I can see it under the /dbfs/FileStore/jars directory, but when I try to use the soffice command in a %sh cell, it does not recognize it.&lt;/P&gt;&lt;P&gt;Could someone guide me on how to achieve this?&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 27 Jul 2023 07:22:05 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/using-libreoffice-in-databricks/m-p/38544#M26668</guid>
      <dc:creator>dzm</dc:creator>
      <dc:date>2023-07-27T07:22:05Z</dc:date>
    </item>
    <item>
      <title>Re: Using Libreoffice in Databricks</title>
      <link>https://community.databricks.com/t5/data-engineering/using-libreoffice-in-databricks/m-p/38556#M26674</link>
      <description>&lt;P&gt;I suppose by Libreoffice you mean the sdk, without the frontend?&lt;/P&gt;&lt;P&gt;You will have to install the jar as a library on the compute cluster.&lt;BR /&gt;From that moment on, you can use the classes in your code.&lt;BR /&gt;If you cannot run the jar from a command line, it might be because it is not an executable.&lt;/P&gt;&lt;P&gt;Besides that: Databricks might not be the correct tool for such a scenario.&lt;/P&gt;</description>
      <pubDate>Thu, 27 Jul 2023 09:59:51 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/using-libreoffice-in-databricks/m-p/38556#M26674</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2023-07-27T09:59:51Z</dc:date>
    </item>
  </channel>
</rss>

