<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Can we run pandas dataframe inside databricks? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25358#M17629</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I don't see any incorrect in your code, I think your code is correct. Could you check the exist of your file or enable dbfs in your workspace?&lt;/P&gt;</description>
    <pubDate>Mon, 21 Nov 2022 02:09:06 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2022-11-21T02:09:06Z</dc:date>
    <item>
      <title>Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25353#M17624</link>
      <description>&lt;P&gt;Hi, I want to run &lt;/P&gt;&lt;P&gt;df=pd.read_csv('/dbfs/FileStore/airlines1.csv') while trying to run getting error like&lt;/P&gt;&lt;P&gt;FileNotFoundError: [Errno 2] No such file or directory: '/dbfs/FileStore/airlines1.csv'&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Could you please help me out how to run pandas dataframe inside databricks or we can not run pandas dataframe directly inside databricks?&lt;/P&gt;</description>
      <pubDate>Fri, 28 Oct 2022 13:47:42 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25353#M17624</guid>
      <dc:creator>tinendra</dc:creator>
      <dc:date>2022-10-28T13:47:42Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25354#M17625</link>
      <description>&lt;P&gt;@Tinendra Kumar​&amp;nbsp;we have been seeing this issue, but as far as documentation i don't see any solid base why pandas read won't support. but we do have workaround 1. read your csv using spark and store in data frame 2. convert spark data frame to pandas  . below links will help 1. &lt;A href="https://docs.databricks.com/external-data/csv.html" alt="https://docs.databricks.com/external-data/csv.html" target="_blank"&gt;CSV file | Databricks on AWS&lt;/A&gt; 2. &lt;A href="https://stackoverflow.com/questions/50958721/convert-a-spark-dataframe-to-pandas-df" alt="https://stackoverflow.com/questions/50958721/convert-a-spark-dataframe-to-pandas-df" target="_blank"&gt;Convert a spark DataFrame to pandas DF - Stack Overflow&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 28 Oct 2022 14:21:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25354#M17625</guid>
      <dc:creator>karthik_p</dc:creator>
      <dc:date>2022-10-28T14:21:16Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25355#M17626</link>
      <description>&lt;P&gt;Hi @Tinendra Kumar​,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I would like to share the following documentation &lt;A href="https://docs.databricks.com/languages/pandas-spark.html#pandas-api-on-spark" target="test_blank"&gt;https://docs.databricks.com/languages/pandas-spark.html#pandas-api-on-spark&lt;/A&gt; This is Pandas APIs on Spark. &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Pandas does not scale out to big data (runs on driver only). Pandas API on Spark fills this gap by providing pandas equivalent APIs that work on Apache Spark. Pandas API on Spark is useful not only for pandas users but also PySpark users, because pandas API on Spark supports many tasks that are difficult to do with PySpark, for example plotting data directly from a PySpark DataFrame.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 31 Oct 2022 18:24:12 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25355#M17626</guid>
      <dc:creator>jose_gonzalez</dc:creator>
      <dc:date>2022-10-31T18:24:12Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25356#M17627</link>
      <description>&lt;P&gt;Thank you Jose&lt;/P&gt;</description>
      <pubDate>Fri, 11 Nov 2022 03:48:39 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25356#M17627</guid>
      <dc:creator>tinendra</dc:creator>
      <dc:date>2022-11-11T03:48:39Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25357#M17628</link>
      <description>&lt;P&gt;Thanks, Karthik&lt;/P&gt;</description>
      <pubDate>Fri, 11 Nov 2022 04:01:14 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25357#M17628</guid>
      <dc:creator>tinendra</dc:creator>
      <dc:date>2022-11-11T04:01:14Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25358#M17629</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I don't see any incorrect in your code, I think your code is correct. Could you check the exist of your file or enable dbfs in your workspace?&lt;/P&gt;</description>
      <pubDate>Mon, 21 Nov 2022 02:09:06 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25358#M17629</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-11-21T02:09:06Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25359#M17630</link>
      <description>&lt;P&gt;Hi @Tinendra Kumar​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope all is well! Just wanted to check in if you were able to resolve your issue and would you be happy to share the solution or &lt;B&gt;mark an answer as best&lt;/B&gt;? Else please let us know if you need more help.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 09 Jan 2023 05:10:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25359#M17630</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2023-01-09T05:10:36Z</dc:date>
    </item>
    <item>
      <title>Re: Can we run pandas dataframe inside databricks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25360#M17631</link>
      <description>&lt;P&gt;Hi @Vidula Khanna​&amp;nbsp;&lt;/P&gt;&lt;P&gt;Yes, my query has been resolved and I got the solution. Thanks for your support.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Tinendra&lt;/P&gt;</description>
      <pubDate>Tue, 14 Feb 2023 12:10:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-run-pandas-dataframe-inside-databricks/m-p/25360#M17631</guid>
      <dc:creator>tinendra</dc:creator>
      <dc:date>2023-02-14T12:10:07Z</dc:date>
    </item>
  </channel>
</rss>

