<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic How to handle complex json schema in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/how-to-handle-complex-json-schema/m-p/57635#M2252</link>
    <description>&lt;P&gt;I have a mounted external directory that is an S3 bucket with multiple subdirectories containing call log files in JSON format.&amp;nbsp; The files are irregular and complex; when I try to use spark.read.json or spark.sql (SELECT *), I get the&amp;nbsp;UNABLE_TO_INFER_SCHEMA error.&amp;nbsp; The files are too complex to try to build a schema manually, plus there are thousands of files.&amp;nbsp; What is the best approach for creating a DataFrame with this data?&lt;/P&gt;</description>
    <pubDate>Thu, 18 Jan 2024 01:47:44 GMT</pubDate>
    <dc:creator>chrisf_sts</dc:creator>
    <dc:date>2024-01-18T01:47:44Z</dc:date>
    <item>
      <title>How to handle complex json schema</title>
      <link>https://community.databricks.com/t5/get-started-discussions/how-to-handle-complex-json-schema/m-p/57635#M2252</link>
      <description>&lt;P&gt;I have a mounted external directory that is an S3 bucket with multiple subdirectories containing call log files in JSON format.&amp;nbsp; The files are irregular and complex; when I try to use spark.read.json or spark.sql (SELECT *), I get the&amp;nbsp;UNABLE_TO_INFER_SCHEMA error.&amp;nbsp; The files are too complex to try to build a schema manually, plus there are thousands of files.&amp;nbsp; What is the best approach for creating a DataFrame with this data?&lt;/P&gt;</description>
      <pubDate>Thu, 18 Jan 2024 01:47:44 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/how-to-handle-complex-json-schema/m-p/57635#M2252</guid>
      <dc:creator>chrisf_sts</dc:creator>
      <dc:date>2024-01-18T01:47:44Z</dc:date>
    </item>
  </channel>
</rss>

