<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Relative path in absolute URI when reading a folder with files containing ":" colons in filename in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12518#M7318</link>
    <description>&lt;P&gt;I am trying to read a folder with partition files where each partition is date/hour/timestamp.csv where timestamp is the exact timestamp in ISO format, e.g. 09-2022-12-05T20:35:15.2786966Z &lt;/P&gt;&lt;P&gt;It seems like Spark is having issues with reading files with colons, which is quite ridiculous.&lt;/P&gt;&lt;P&gt;The issue was raised in 2019 &lt;A href="https://issues.apache.org/jira/browse/SPARK-28841" target="_blank"&gt;https://issues.apache.org/jira/browse/SPARK-28841&lt;/A&gt; but it seems like the issue remains.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;What is the solution, rather than now renaming zillions of file names, which in S3 requires a copy... &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I am using Spark 3.2.1&lt;/P&gt;</description>
    <pubDate>Wed, 11 Jan 2023 17:42:02 GMT</pubDate>
    <dc:creator>chanansh</dc:creator>
    <dc:date>2023-01-11T17:42:02Z</dc:date>
    <item>
      <title>Relative path in absolute URI when reading a folder with files containing ":" colons in filename</title>
      <link>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12518#M7318</link>
      <description>&lt;P&gt;I am trying to read a folder with partition files where each partition is date/hour/timestamp.csv where timestamp is the exact timestamp in ISO format, e.g. 09-2022-12-05T20:35:15.2786966Z &lt;/P&gt;&lt;P&gt;It seems like Spark is having issues with reading files with colons, which is quite ridiculous.&lt;/P&gt;&lt;P&gt;The issue was raised in 2019 &lt;A href="https://issues.apache.org/jira/browse/SPARK-28841" target="_blank"&gt;https://issues.apache.org/jira/browse/SPARK-28841&lt;/A&gt; but it seems like the issue remains.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;What is the solution, rather than now renaming zillions of file names, which in S3 requires a copy... &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I am using Spark 3.2.1&lt;/P&gt;</description>
      <pubDate>Wed, 11 Jan 2023 17:42:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12518#M7318</guid>
      <dc:creator>chanansh</dc:creator>
      <dc:date>2023-01-11T17:42:02Z</dc:date>
    </item>
    <item>
      <title>Re: Relative path in absolute URI when reading a folder with files containing ":" colons in filename</title>
      <link>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12521#M7321</link>
      <description>&lt;P&gt;I have renamed the files replacing : with - as the bug still exists &lt;/P&gt;</description>
      <pubDate>Tue, 17 Jan 2023 09:40:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12521#M7321</guid>
      <dc:creator>chanansh</dc:creator>
      <dc:date>2023-01-17T09:40:22Z</dc:date>
    </item>
    <item>
      <title>Re: Relative path in absolute URI when reading a folder with files containing ":" colons in filename</title>
      <link>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12519#M7319</link>
      <description>&lt;P&gt;The issue was reopened again &lt;A href="https://issues.apache.org/jira/browse/HDFS-14762" target="_blank"&gt;https://issues.apache.org/jira/browse/HDFS-14762&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 11 Jan 2023 22:04:17 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/relative-path-in-absolute-uri-when-reading-a-folder-with-files/m-p/12519#M7319</guid>
      <dc:creator>Debayan</dc:creator>
      <dc:date>2023-01-11T22:04:17Z</dc:date>
    </item>
  </channel>
</rss>

