<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic SparkR or sparklyr not showing history in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/sparkr-or-sparklyr-not-showing-history/m-p/67581#M33372</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;for some reason Azure Databricks doesn't show History if the data is saved with SparkR (2 in the figure below) or Sparklyr (3), but it does show it with Data Ingestion (0) or with PySpark (1). Is this a known bug or am I doing something wrong? Is it possible to save data with R while getting the UserId and Username?&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Databricks_history.PNG" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/7303i016A49BF1F7312D4/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Databricks_history.PNG" alt="Databricks_history.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;PySpark code:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;test_data = [[4,"d",30],[5,"e",70]]
df = spark.createDataFrame(test_data,['a','b','c'])
df.write.mode('append').format("delta").saveAsTable("catalog.schema.table")&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;SparkR df and save to table:&lt;/P&gt;&lt;DIV&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="SparkR.PNG" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/7305i7C9BC5D69CB1EEC9/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="SparkR.PNG" alt="SparkR.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Sparklyr&amp;nbsp;&lt;SPAN&gt;df and save to table:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Sparklyr.PNG" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/7306i7BFC2F78A92EFE68/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Sparklyr.PNG" alt="Sparklyr.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;/DIV&gt;</description>
    <pubDate>Mon, 29 Apr 2024 10:48:32 GMT</pubDate>
    <dc:creator>Sagas</dc:creator>
    <dc:date>2024-04-29T10:48:32Z</dc:date>
    <item>
      <title>SparkR or sparklyr not showing history</title>
      <link>https://community.databricks.com/t5/data-engineering/sparkr-or-sparklyr-not-showing-history/m-p/67581#M33372</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;for some reason Azure Databricks doesn't show History if the data is saved with SparkR (2 in the figure below) or Sparklyr (3), but it does show it with Data Ingestion (0) or with PySpark (1). Is this a known bug or am I doing something wrong? Is it possible to save data with R while getting the UserId and Username?&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Databricks_history.PNG" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/7303i016A49BF1F7312D4/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Databricks_history.PNG" alt="Databricks_history.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;PySpark code:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="python"&gt;test_data = [[4,"d",30],[5,"e",70]]
df = spark.createDataFrame(test_data,['a','b','c'])
df.write.mode('append').format("delta").saveAsTable("catalog.schema.table")&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;SparkR df and save to table:&lt;/P&gt;&lt;DIV&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="SparkR.PNG" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/7305i7C9BC5D69CB1EEC9/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="SparkR.PNG" alt="SparkR.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Sparklyr&amp;nbsp;&lt;SPAN&gt;df and save to table:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Sparklyr.PNG" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/7306i7BFC2F78A92EFE68/image-size/medium/is-moderation-mode/true?v=v2&amp;amp;px=400" role="button" title="Sparklyr.PNG" alt="Sparklyr.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;/DIV&gt;</description>
      <pubDate>Mon, 29 Apr 2024 10:48:32 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/sparkr-or-sparklyr-not-showing-history/m-p/67581#M33372</guid>
      <dc:creator>Sagas</dc:creator>
      <dc:date>2024-04-29T10:48:32Z</dc:date>
    </item>
    <item>
      <title>Re: SparkR or sparklyr not showing history</title>
      <link>https://community.databricks.com/t5/data-engineering/sparkr-or-sparklyr-not-showing-history/m-p/67593#M33377</link>
      <description>&lt;P&gt;Thank you for your response! I'll consider capturing UserId for each row. But do you mean that sparklyr also can't automatically capture the userId for the Delta table history?&lt;/P&gt;</description>
      <pubDate>Mon, 29 Apr 2024 14:00:33 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/sparkr-or-sparklyr-not-showing-history/m-p/67593#M33377</guid>
      <dc:creator>Sagas</dc:creator>
      <dc:date>2024-04-29T14:00:33Z</dc:date>
    </item>
  </channel>
</rss>

