<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic PDF Generation via databricks Job in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113559#M44569</link>
    <description>&lt;P&gt;We have a Databricks job that will aggregate some data and create some data tables. This needs to be exported in PDF format.&lt;BR /&gt;&lt;BR /&gt;I have seen a few Python libraries that can generate PDFs, but was wondering if the PDF can be generated and dropped in a cloud storage location from a Databricks job.&lt;BR /&gt;&lt;BR /&gt;If anyone has some ideas on this, they would be greatly appreciated.&lt;BR /&gt;&lt;BR /&gt;Mulder&lt;/P&gt;</description>
    <pubDate>Tue, 25 Mar 2025 18:31:36 GMT</pubDate>
    <dc:creator>Mulder81</dc:creator>
    <dc:date>2025-03-25T18:31:36Z</dc:date>
    <item>
      <title>PDF Generation via databricks Job</title>
      <link>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113559#M44569</link>
      <description>&lt;P&gt;We have a Databricks job that will aggregate some data and create some data tables. This needs to be exported in PDF format.&lt;BR /&gt;&lt;BR /&gt;I have seen a few Python libraries that can generate PDFs, but was wondering if the PDF can be generated and dropped in a cloud storage location from a Databricks job.&lt;BR /&gt;&lt;BR /&gt;If anyone has some ideas on this, they would be greatly appreciated.&lt;BR /&gt;&lt;BR /&gt;Mulder&lt;/P&gt;</description>
      <pubDate>Tue, 25 Mar 2025 18:31:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113559#M44569</guid>
      <dc:creator>Mulder81</dc:creator>
      <dc:date>2025-03-25T18:31:36Z</dc:date>
    </item>
    <item>
      <title>Re: PDF Generation via databricks Job</title>
      <link>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113567#M44571</link>
      <description>&lt;P&gt;Hey &lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/77919"&gt;@Mulder81&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;After generating the file, you can copy it to dedicated blob storage using the command below.&lt;/P&gt;&lt;P&gt;dbutils.fs.cp(source_path,&amp;nbsp;destination_path)&lt;/P&gt;&lt;P&gt;You can also try saving the file in the desired path (blob storage), but there can be some obstacles.&amp;nbsp;&lt;/P&gt;&lt;P&gt;BR,&lt;/P&gt;&lt;P&gt;Piotrek&lt;/P&gt;</description>
      <pubDate>Tue, 25 Mar 2025 19:10:01 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113567#M44571</guid>
      <dc:creator>PiotrMi</dc:creator>
      <dc:date>2025-03-25T19:10:01Z</dc:date>
    </item>
    <item>
      <title>Re: PDF Generation via databricks Job</title>
      <link>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113570#M44574</link>
      <description>&lt;P&gt;Are there any specific ways to generate the PDF file from a dataframe, and any libraries that work?&lt;/P&gt;</description>
      <pubDate>Tue, 25 Mar 2025 19:23:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113570#M44574</guid>
      <dc:creator>Mulder81</dc:creator>
      <dc:date>2025-03-25T19:23:49Z</dc:date>
    </item>
    <item>
      <title>Re: PDF Generation via databricks Job</title>
      <link>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113593#M44579</link>
      <description>&lt;P&gt;Hey &lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/77919"&gt;@Mulder81&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;You can try this article:&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;A title="Pdf tutorial" href="https://medium.com/@mahijain9211/creating-a-python-class-for-generating-pdf-tables-from-a-pandas-dataframe-using-fpdf2-c0eb4b88355c" target="_blank" rel="noopener"&gt;https://medium.com/@mahijain9211/creating-a-python-class-for-generating-pdf-tables-from-a-pandas-dataframe-using-fpdf2-c0eb4b88355c&lt;/A&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;It uses pandas and fpdf. Also, you need to read about the temporary location/path where you save the PDF for later copying to blob storage.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 25 Mar 2025 21:23:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/pdf-generation-via-databricks-job/m-p/113593#M44579</guid>
      <dc:creator>PiotrMi</dc:creator>
      <dc:date>2025-03-25T21:23:16Z</dc:date>
    </item>
  </channel>
</rss>

