<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Translating SQL Value Function For XML To Databricks SQL in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/105004#M41972</link>
    <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/141582"&gt;@BNV&lt;/a&gt;&amp;nbsp;, little more complex querying to convert XML into rows use below query. For your case just replace XML string with column containing XML value, spark will handle.&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;select c_value as colID, v_value as value from(select
  posexplode(
    xpath(
      '''
      &amp;lt;XMLData&amp;gt;
      &amp;lt;Values&amp;gt;
      &amp;lt;ValueDefinition colID="10" Value="Red"/&amp;gt;
      &amp;lt;ValueDefinition colID="20" Value="Square"/&amp;gt;
      &amp;lt;ValueDefinition colID="3" Value=""/&amp;gt;
      &amp;lt;/Values&amp;gt;
      &amp;lt;/XMLData&amp;gt;''',
      '//ValueDefinition/@colID'
    )
  ) as (c_index, c_value),
  posexplode(
    xpath(
      '''
      &amp;lt;XMLData&amp;gt;
      &amp;lt;Values&amp;gt;
      &amp;lt;ValueDefinition colID="10" Value="Red"/&amp;gt;
      &amp;lt;ValueDefinition colID="20" Value="Square"/&amp;gt;
      &amp;lt;ValueDefinition colID="3" Value=""/&amp;gt;
      &amp;lt;/Values&amp;gt;
      &amp;lt;/XMLData&amp;gt;''',
      '//ValueDefinition/@Value'
    )
  ) as (v_index, v_value))
  where c_index = v_index&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Hari Prasad&lt;/P&gt;</description>
    <pubDate>Thu, 09 Jan 2025 17:28:06 GMT</pubDate>
    <dc:creator>hari-prasad</dc:creator>
    <dc:date>2025-01-09T17:28:06Z</dc:date>
    <item>
      <title>Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104743#M41863</link>
      <description>&lt;P&gt;Trying to translate this line of a SQL query that evaluates XML to Databricks SQL.&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;FONT face="courier new,courier"&gt;&lt;FONT face="courier new,courier"&gt;&lt;SPAN&gt;SELECT&lt;BR /&gt;&lt;/SPAN&gt;&lt;/FONT&gt;&lt;/FONT&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;FONT face="courier new,courier"&gt;&lt;SPAN&gt;&amp;nbsp; &amp;nbsp;MyColumn.value('(/XMLData/Values/ValueDefinition[@colID="10"]/@Value)[1]', 'VARCHAR(max)') as Color&lt;/SPAN&gt;&lt;/FONT&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;FONT face="arial,helvetica,sans-serif"&gt;&lt;SPAN&gt;The XML looks like this:&lt;/SPAN&gt;&lt;/FONT&gt;&lt;/DIV&gt;&lt;DIV&gt;&lt;FONT face="courier new,courier"&gt;&lt;SPAN&gt;&amp;lt;XMLData&amp;gt;&amp;lt;Values&amp;gt;&amp;lt;ValueDefinition colID="10" Value="Red"/&amp;gt;&amp;lt;ValueDefinition colID="20" Value="Square"/&amp;gt;&amp;lt;ValueDefinition colID="3" Value=""/&amp;gt;&amp;lt;/Values&amp;gt;&amp;lt;/XMLData&amp;gt;&lt;/SPAN&gt;&lt;/FONT&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;FONT face="arial,helvetica,sans-serif"&gt;&lt;SPAN&gt;Databricks SQL doesn't seem to support this function ("&lt;SPAN class=""&gt;AnalysisException: &lt;/SPAN&gt;Undefined function: MyColumn.value").&lt;/SPAN&gt;&lt;/FONT&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;FONT face="arial,helvetica,sans-serif"&gt;&lt;SPAN&gt;Is there anything I can substitute &lt;U&gt;within the query line&lt;/U&gt; that will work?&lt;/SPAN&gt;&lt;/FONT&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
      <pubDate>Wed, 08 Jan 2025 17:04:10 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104743#M41863</guid>
      <dc:creator>BNV</dc:creator>
      <dc:date>2025-01-08T17:04:10Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104745#M41864</link>
      <description>&lt;P&gt;Hi &lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/141582"&gt;@BNV&lt;/a&gt;,&lt;/P&gt;&lt;P&gt;You can leverage &lt;STRONG&gt;UDF or&lt;/STRONG&gt;&amp;nbsp;&lt;STRONG&gt;pandasUDF&lt;/STRONG&gt; to register user defined functions to customize to parse the XML data using standard python libraries or even in Scala or Java in Databricks notebooks.&lt;/P&gt;&lt;P&gt;In SQL warehouse, you can create custom SQL UDF, follow this link for more&amp;nbsp;&lt;A href="https://www.databricks.com/blog/2021/10/20/introducing-sql-user-defined-functions.html" target="_blank"&gt;Introducing SQL User-Defined Functions | Databricks Blog&lt;/A&gt;.&lt;/P&gt;</description>
      <pubDate>Wed, 08 Jan 2025 17:19:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104745#M41864</guid>
      <dc:creator>hari-prasad</dc:creator>
      <dc:date>2025-01-08T17:19:07Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104748#M41865</link>
      <description>&lt;P&gt;Thank you but I'm not very familiar with Pandas.&amp;nbsp;This might be out of my realm of knowledge.&lt;/P&gt;&lt;P&gt;Are you saying Pandas would have this functionality including using SQL and that SQL function or that I would need to create a UDF to parse XML (which sounds quite difficult).&lt;/P&gt;</description>
      <pubDate>Wed, 08 Jan 2025 17:14:19 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104748#M41865</guid>
      <dc:creator>BNV</dc:creator>
      <dc:date>2025-01-08T17:14:19Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104753#M41867</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/141582"&gt;@BNV&lt;/a&gt;,&amp;nbsp;you can leverage&amp;nbsp;&lt;STRONG&gt;xpath&lt;/STRONG&gt; SQL function which can parse the XML which works in both Notebook and SQL warehouse, follow this Spark SQL doc for more details&amp;nbsp;&lt;A href="https://spark.apache.org/docs/3.5.4/api/sql/#xpath" target="_blank" rel="noopener"&gt;https://spark.apache.org/docs/3.5.4/api/sql/#xpath&lt;/A&gt;&lt;/P&gt;&lt;P&gt;here is a sample example&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="hariprasad_0-1736357597347.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/13951iFB28D4AF5ABD964E/image-size/medium?v=v2&amp;amp;px=400" role="button" title="hariprasad_0-1736357597347.png" alt="hariprasad_0-1736357597347.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 08 Jan 2025 17:34:11 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104753#M41867</guid>
      <dc:creator>hari-prasad</dc:creator>
      <dc:date>2025-01-08T17:34:11Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104785#M41877</link>
      <description>&lt;P&gt;This might be a good start but I do get an error ("Invalid XPath") when trying to access the column as the xpath. Is it not possible to use a column as the xpath?&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;SPAN&gt;SELECT xpath(MyColumn.value&lt;/SPAN&gt;&lt;SPAN&gt;,&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;'/XMLData/Values/ValueDefinition[@colID="10"]/@Value)[1]'&lt;/SPAN&gt;&lt;SPAN&gt;) &lt;/SPAN&gt;&lt;SPAN&gt;as&lt;/SPAN&gt;&lt;SPAN&gt; Remarks&lt;/SPAN&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 08 Jan 2025 21:23:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104785#M41877</guid>
      <dc:creator>BNV</dc:creator>
      <dc:date>2025-01-08T21:23:36Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104828#M41896</link>
      <description>&lt;P&gt;you can share a sample or mocked value, how your xml looks?&lt;/P&gt;&lt;P&gt;mean while you can give a try with below query&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;EM&gt;SELECT xpath_string(MyColumn.value, '/XMLData/Values/ValueDefinition[@colID="10"]/@Value')[1] as Remarks&lt;/EM&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
      <pubDate>Thu, 09 Jan 2025 04:03:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104828#M41896</guid>
      <dc:creator>hari-prasad</dc:creator>
      <dc:date>2025-01-09T04:03:49Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104842#M41900</link>
      <description>&lt;P&gt;Since Spark Runtime 14.3 and higher, it is possible to read XML using the Spark Read method.&lt;/P&gt;&lt;P&gt;For example:&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;df = spark.read.option("rowTag", "books").format("xml").load(xmlPath)
df.printSchema()
df.show(truncate=False)&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Have a look at the docu:&amp;nbsp;&lt;A href="https://docs.databricks.com/en/query/formats/xml.html" target="_self"&gt;https://docs.databricks.com/en/query/formats/xml.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jan 2025 06:02:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104842#M41900</guid>
      <dc:creator>Stefan-Koch</dc:creator>
      <dc:date>2025-01-09T06:02:26Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104854#M41904</link>
      <description>&lt;P&gt;Yes, now they support XML parse directly in databricks 14.3 or higher, else earlier you could have leveraged spark xml library jars to parse it.&lt;/P&gt;&lt;P&gt;You can still leverage xpath in case where one of data column hold XML value in a dataset. As &lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/141582"&gt;@BNV&lt;/a&gt;&amp;nbsp;is looking for some SQL based approach.&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jan 2025 07:13:04 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104854#M41904</guid>
      <dc:creator>hari-prasad</dc:creator>
      <dc:date>2025-01-09T07:13:04Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104997#M41969</link>
      <description>&lt;P&gt;Hi. Thank you for replying. My XML sample is in the original post above if it helps.&lt;/P&gt;&lt;P&gt;I doesn't seem like the "_string" version because it's saying:&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN class=""&gt;AnalysisException: &lt;/SPAN&gt;&lt;SPAN&gt;Can't extract value from xpath_string(ExData#251799, /XMLData/Values/ValueDefinition[@colID="10"]/@Value')[1]): need struct type but got string&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jan 2025 16:56:27 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/104997#M41969</guid>
      <dc:creator>BNV</dc:creator>
      <dc:date>2025-01-09T16:56:27Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/105002#M41970</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/141582"&gt;@BNV&lt;/a&gt;,&amp;nbsp; below SQL code worked for me, I'm able to extract &lt;STRONG&gt;Red&lt;/STRONG&gt; for &lt;STRONG&gt;&lt;EM&gt;colID=10&lt;/EM&gt;&lt;/STRONG&gt;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;select
  xpath(
    '''
    &amp;lt;XMLData&amp;gt;
    &amp;lt;Values&amp;gt;
    &amp;lt;ValueDefinition colID="10" Value="Red"/&amp;gt;
    &amp;lt;ValueDefinition colID="20" Value="Square"/&amp;gt;
    &amp;lt;ValueDefinition colID="3" Value=""/&amp;gt;
    &amp;lt;/Values&amp;gt;
    &amp;lt;/XMLData&amp;gt;''',
    '//ValueDefinition[@colID="10"]/@Value'
  )[0] as value&lt;/LI-CODE&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="hariprasad_0-1736442966726.png" style="width: 400px;"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/13985iEE3019A3BE6764D4/image-size/medium?v=v2&amp;amp;px=400" role="button" title="hariprasad_0-1736442966726.png" alt="hariprasad_0-1736442966726.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jan 2025 17:20:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/105002#M41970</guid>
      <dc:creator>hari-prasad</dc:creator>
      <dc:date>2025-01-09T17:20:03Z</dc:date>
    </item>
    <item>
      <title>Re: Translating SQL Value Function For XML To Databricks SQL</title>
      <link>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/105004#M41972</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/141582"&gt;@BNV&lt;/a&gt;&amp;nbsp;, little more complex querying to convert XML into rows use below query. For your case just replace XML string with column containing XML value, spark will handle.&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;select c_value as colID, v_value as value from(select
  posexplode(
    xpath(
      '''
      &amp;lt;XMLData&amp;gt;
      &amp;lt;Values&amp;gt;
      &amp;lt;ValueDefinition colID="10" Value="Red"/&amp;gt;
      &amp;lt;ValueDefinition colID="20" Value="Square"/&amp;gt;
      &amp;lt;ValueDefinition colID="3" Value=""/&amp;gt;
      &amp;lt;/Values&amp;gt;
      &amp;lt;/XMLData&amp;gt;''',
      '//ValueDefinition/@colID'
    )
  ) as (c_index, c_value),
  posexplode(
    xpath(
      '''
      &amp;lt;XMLData&amp;gt;
      &amp;lt;Values&amp;gt;
      &amp;lt;ValueDefinition colID="10" Value="Red"/&amp;gt;
      &amp;lt;ValueDefinition colID="20" Value="Square"/&amp;gt;
      &amp;lt;ValueDefinition colID="3" Value=""/&amp;gt;
      &amp;lt;/Values&amp;gt;
      &amp;lt;/XMLData&amp;gt;''',
      '//ValueDefinition/@Value'
    )
  ) as (v_index, v_value))
  where c_index = v_index&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Hari Prasad&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jan 2025 17:28:06 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/translating-sql-value-function-for-xml-to-databricks-sql/m-p/105004#M41972</guid>
      <dc:creator>hari-prasad</dc:creator>
      <dc:date>2025-01-09T17:28:06Z</dc:date>
    </item>
  </channel>
</rss>

