<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: TesseractNotFoundError in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7376#M3264</link>
    <description>&lt;P&gt;Hello @feed expedition​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;You can also try this - &lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Create a new cluster or select an existing one in Databricks.&lt;/LI&gt;&lt;LI&gt;In the "Libraries" tab of the cluster settings, click on "Install New" and select "PyPI".&lt;/LI&gt;&lt;LI&gt;In the "Package" field, enter "pytesseract".&lt;/LI&gt;&lt;LI&gt;Click on "Install" and wait for the installation to complete.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Nandini&lt;/P&gt;</description>
    <pubDate>Tue, 21 Mar 2023 11:28:44 GMT</pubDate>
    <dc:creator>NandiniN</dc:creator>
    <dc:date>2023-03-21T11:28:44Z</dc:date>
    <item>
      <title>TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7374#M3262</link>
      <description>&lt;P&gt;TesseractNotFoundError: tesseract is not installed or it's not in your PATH. See README file for more information. in databricks&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 21 Mar 2023 09:51:35 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7374#M3262</guid>
      <dc:creator>feed</dc:creator>
      <dc:date>2023-03-21T09:51:35Z</dc:date>
    </item>
    <item>
      <title>Re: TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7375#M3263</link>
      <description>&lt;P&gt;To install Tesseract on your Databricks cluster, you can use the following command&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;%sh apt-get install -y tesseract-ocr&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;After installing Tesseract, you need to add the path to the Tesseract executable file to your PATH environment variable. To do this, you can run the following command in a Databricks notebook:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;%sh echo 'export PATH=/usr/bin:$PATH' &amp;gt;&amp;gt; ~/.bashrc &amp;amp;&amp;amp; source ~/.bashrc&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This command adds the path to the Tesseract executable file to your PATH environment variable and makes it accessible to your Databricks notebook.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Check if Tesseract OCR is installed on your Databricks cluster. You can do this by running the following command in a Databricks notebook:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;%sh which tesseract&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;After following these steps, you should be able to use pytesseract in your Databricks notebook without encountering the "TesseractNotFoundError" error.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 21 Mar 2023 09:55:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7375#M3263</guid>
      <dc:creator>feed</dc:creator>
      <dc:date>2023-03-21T09:55:34Z</dc:date>
    </item>
    <item>
      <title>Re: TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7376#M3264</link>
      <description>&lt;P&gt;Hello @feed expedition​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;You can also try this - &lt;/P&gt;&lt;OL&gt;&lt;LI&gt;Create a new cluster or select an existing one in Databricks.&lt;/LI&gt;&lt;LI&gt;In the "Libraries" tab of the cluster settings, click on "Install New" and select "PyPI".&lt;/LI&gt;&lt;LI&gt;In the "Package" field, enter "pytesseract".&lt;/LI&gt;&lt;LI&gt;Click on "Install" and wait for the installation to complete.&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks &amp;amp; Regards,&lt;/P&gt;&lt;P&gt;Nandini&lt;/P&gt;</description>
      <pubDate>Tue, 21 Mar 2023 11:28:44 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7376#M3264</guid>
      <dc:creator>NandiniN</dc:creator>
      <dc:date>2023-03-21T11:28:44Z</dc:date>
    </item>
    <item>
      <title>Re: TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7377#M3265</link>
      <description>&lt;P&gt;Yes, of course. This is fine if you need to install the Python library pytesseract.&lt;/P&gt;&lt;P&gt;But if you need to extract text from an image, you should install Tesseract OCR on the working cluster.&lt;/P&gt;&lt;P&gt;Otherwise it will give this error.&lt;/P&gt;</description>
      <pubDate>Tue, 21 Mar 2023 11:53:37 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7377#M3265</guid>
      <dc:creator>feed</dc:creator>
      <dc:date>2023-03-21T11:53:37Z</dc:date>
    </item>
    <item>
      <title>Re: TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7378#M3266</link>
      <description>&lt;P&gt;Ack. Thank you for sharing!&lt;/P&gt;</description>
      <pubDate>Tue, 21 Mar 2023 17:27:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7378#M3266</guid>
      <dc:creator>NandiniN</dc:creator>
      <dc:date>2023-03-21T17:27:23Z</dc:date>
    </item>
    <item>
      <title>Re: TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7379#M3267</link>
      <description>&lt;P&gt;Hi @feed expedition​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope all is well! Just wanted to check in if you were able to resolve your issue and would you be happy to share the solution or mark an answer as best? Else please let us know if you need more help.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 22 Mar 2023 03:18:10 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/7379#M3267</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2023-03-22T03:18:10Z</dc:date>
    </item>
    <item>
      <title>Re: TesseractNotFoundError</title>
      <link>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/55594#M30378</link>
      <description>&lt;P&gt;The command "%sh apt-get install -y tesseract-ocr" is not working in my new Databricks&amp;nbsp;free trial account; earlier it worked fine in my old Databricks&amp;nbsp;instance. I get the error below: E: Could not open lock file /var/lib/dpkg/lock-frontend - open (13: Permission denied) E: Unable to acquire the dpkg frontend lock (/var/lib/dpkg/lock-frontend), are you root? I have installed both pytesseract and tesseract from the Libraries section of the cluster as well as with the pip install command in the notebook, but even after doing all the steps I still get&amp;nbsp;TesseractNotFoundError. Please let me know if anyone can help me.&lt;/P&gt;</description>
      <pubDate>Thu, 21 Dec 2023 11:03:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/tesseractnotfounderror/m-p/55594#M30378</guid>
      <dc:creator>neha_ayodhya</dc:creator>
      <dc:date>2023-12-21T11:03:16Z</dc:date>
    </item>
  </channel>
</rss>

