<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: parsing json string value column into dataframe structure in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98605#M39775</link>
    <description>&lt;P&gt;Would you know the elements in the Kafka event JSON ahead of time, or could you count the number of elements each time, then generate the schema for them and pass it to from_json to parse?&amp;nbsp; &lt;A href="https://spark.apache.org/docs/latest/api/python/reference/pyspark.sql/api/pyspark.sql.functions.from_json.html" target="_blank"&gt;https://spark.apache.org/docs/latest/api/python/reference/pyspark.sql/api/pyspark.sql.functions.from_json.html&lt;/A&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 13 Nov 2024 05:58:34 GMT</pubDate>
    <dc:creator>SparkJun</dc:creator>
    <dc:date>2024-11-13T05:58:34Z</dc:date>
    <item>
      <title>parsing json string value column into dataframe structure</title>
      <link>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98603#M39774</link>
      <description>&lt;P&gt;Hi All,&lt;/P&gt;&lt;P&gt;I have to read a Kafka payload whose value column contains a JSON string. The format of the JSON is as below.&lt;/P&gt;&lt;P&gt;&lt;SPAN class=""&gt;{&lt;/SPAN&gt; &lt;SPAN class=""&gt;"data"&lt;/SPAN&gt;&lt;SPAN class=""&gt;:&lt;/SPAN&gt; &lt;SPAN class=""&gt;[&lt;/SPAN&gt; &lt;SPAN class=""&gt;{&lt;/SPAN&gt; &lt;SPAN class=""&gt;"p_al4"&lt;/SPAN&gt;&lt;SPAN class=""&gt;:&lt;/SPAN&gt; &lt;SPAN class=""&gt;"N/A"&lt;/SPAN&gt;&lt;SPAN class=""&gt;,&lt;/SPAN&gt; &lt;SPAN class=""&gt;"p_a5"&lt;/SPAN&gt;&lt;SPAN class=""&gt;:&lt;/SPAN&gt; &lt;SPAN class=""&gt;"N/A"&lt;/SPAN&gt;&lt;SPAN class=""&gt;,&lt;/SPAN&gt; &lt;SPAN class=""&gt;"p_ad"&lt;/SPAN&gt;&lt;SPAN class=""&gt;:&lt;/SPAN&gt; &lt;SPAN class=""&gt;"OA003"&lt;/SPAN&gt;&lt;SPAN class=""&gt;,&lt;/SPAN&gt; &lt;SPAN class=""&gt;"p_aName"&lt;/SPAN&gt;&lt;SPAN class=""&gt;:&lt;/SPAN&gt; &lt;SPAN class=""&gt;"Abc"&lt;/SPAN&gt;&lt;SPAN class=""&gt;,&lt;/SPAN&gt; &lt;SPAN class=""&gt;"p_aFlag"&lt;/SPAN&gt;&lt;SPAN class=""&gt;:&lt;/SPAN&gt; &lt;SPAN class=""&gt;&lt;SPAN class=""&gt;true&lt;/SPAN&gt;&lt;/SPAN&gt;&amp;nbsp;,....(dynamic)&lt;SPAN class=""&gt;}&lt;/SPAN&gt; &lt;SPAN class=""&gt;]&lt;/SPAN&gt; &lt;SPAN class=""&gt;}&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN class=""&gt;The data key can hold a dynamic number of key-value pairs.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN class=""&gt;Here each "p_" key is a column and its respective value is given.&lt;BR /&gt;Please suggest how to convert this payload into a dataframe structure,&lt;BR /&gt;like below:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN class=""&gt;+-----+-----+-----+-------+------+------------------+&lt;BR /&gt;|p_al4 | p_a5 | p_ad | p_aName | p_aFlag|&lt;BR /&gt;+-----+-----+-----+-------+------+----------------+&lt;BR /&gt;|N/A | N/A | OU13| Admin | true |&lt;BR /&gt;+-----+-----+-----+-------+------+--------------&lt;BR /&gt;&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 13 Nov 2024 05:22:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98603#M39774</guid>
      <dc:creator>dipali_globant</dc:creator>
      <dc:date>2024-11-13T05:22:16Z</dc:date>
    </item>
    <item>
      <title>Re: parsing json string value column into dataframe structure</title>
      <link>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98605#M39775</link>
      <description>&lt;P&gt;Would you know the elements in the Kafka event JSON ahead of time, or could you count the number of elements each time, then generate the schema for them and pass it to from_json to parse?&amp;nbsp; &lt;A href="https://spark.apache.org/docs/latest/api/python/reference/pyspark.sql/api/pyspark.sql.functions.from_json.html" target="_blank"&gt;https://spark.apache.org/docs/latest/api/python/reference/pyspark.sql/api/pyspark.sql.functions.from_json.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 13 Nov 2024 05:58:34 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98605#M39775</guid>
      <dc:creator>SparkJun</dc:creator>
      <dc:date>2024-11-13T05:58:34Z</dc:date>
    </item>
    <item>
      <title>Re: parsing json string value column into dataframe structure</title>
      <link>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98612#M39776</link>
      <description>&lt;P&gt;No, I don't know the elements in the JSON, so I can't define the structure.&lt;/P&gt;</description>
      <pubDate>Wed, 13 Nov 2024 06:30:11 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/parsing-json-string-value-column-into-dataframe-structure/m-p/98612#M39776</guid>
      <dc:creator>dipali_globant</dc:creator>
      <dc:date>2024-11-13T06:30:11Z</dc:date>
    </item>
  </channel>
</rss>

