<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Data persistence, Dataframe, and Delta in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31186#M22688</link>
    <description>&lt;P&gt;Hey there @Vivek Ranjan​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope you are doing great!&lt;/P&gt;&lt;P&gt;Just wanted to check in if you were able to resolve your issue or do you need more help? We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
    <pubDate>Thu, 12 May 2022 13:50:49 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2022-05-12T13:50:49Z</dc:date>
    <item>
      <title>Data persistence, Dataframe, and Delta</title>
      <link>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31182#M22684</link>
      <description>&lt;P&gt;I am new to the Databricks platform. &lt;/P&gt;&lt;OL&gt;&lt;LI&gt;What is the best way to keep data persistent so that once I restart the cluster I don't need to run all the code again and can simply continue developing my notebook with the cached data?&lt;/LI&gt;&lt;LI&gt;I have created many dataframes and I want to save them as Delta tables using the code: &lt;/LI&gt;&lt;/OL&gt;&lt;PRE&gt;&lt;CODE&gt;dataFrame.to_delta('/dbfs/Projects/', index_col='index')&lt;/CODE&gt;&lt;/PRE&gt;&lt;OL&gt;&lt;LI&gt;When I then list the table using the command, I see a table with two columns: path and name. The path column contains the path starting from dbfs:/dbfs/Projects/part-00000-xxxx-snappy.parquet. The name column has only the filename part. How will I later query those two tables if the dataframe name is not saved with the filename? Do I have to query by the extremely long filename?&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 21 Jan 2022 17:30:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31182#M22684</guid>
      <dc:creator>Vik1</dc:creator>
      <dc:date>2022-01-21T17:30:02Z</dc:date>
    </item>
    <item>
      <title>Re: Data persistence, Dataframe, and Delta</title>
      <link>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31183#M22685</link>
      <description>&lt;P&gt;Hi @Vivek Ranjan​! My name is Piper, and I'm a moderator for the community. Welcome to Databricks and the community! Thank you for your question. We give our members time to respond to questions before we circle back. &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks in advance for your patience and best wishes on your Databricks journey.&lt;/P&gt;</description>
      <pubDate>Fri, 21 Jan 2022 19:50:45 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31183#M22685</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-01-21T19:50:45Z</dc:date>
    </item>
    <item>
      <title>Re: Data persistence, Dataframe, and Delta</title>
      <link>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31184#M22686</link>
      <description>&lt;P&gt;You can just use spark.read.format("delta").load("path to the parent folder of the '_delta_log' folder") &lt;/P&gt;&lt;P&gt;or save it as a table and read that table.&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.microsoft.com/en-us/azure/databricks/delta/quick-start" alt="https://docs.microsoft.com/en-us/azure/databricks/delta/quick-start" target="_blank"&gt;https://docs.microsoft.com/en-us/azure/databricks/delta/quick-start&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 25 Jan 2022 14:32:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31184#M22686</guid>
      <dc:creator>-werners-</dc:creator>
      <dc:date>2022-01-25T14:32:41Z</dc:date>
    </item>
    <item>
      <title>Re: Data persistence, Dataframe, and Delta</title>
      <link>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31185#M22687</link>
      <description>&lt;P&gt;@Vivek Ranjan​&amp;nbsp;- Does werners' response answer your question? If yes, would you be happy to mark it as best so that other members can find the solution more quickly?&lt;/P&gt;</description>
      <pubDate>Wed, 26 Jan 2022 16:42:15 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31185#M22687</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-01-26T16:42:15Z</dc:date>
    </item>
    <item>
      <title>Re: Data persistence, Dataframe, and Delta</title>
      <link>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31186#M22688</link>
      <description>&lt;P&gt;Hey there @Vivek Ranjan​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope you are doing great!&lt;/P&gt;&lt;P&gt;Just wanted to check in if you were able to resolve your issue or do you need more help? We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 12 May 2022 13:50:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/data-persistence-dataframe-and-delta/m-p/31186#M22688</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-05-12T13:50:49Z</dc:date>
    </item>
  </channel>
</rss>

