<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic springml sftp with spark 3.x in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116420#M45309</link>
    <description>&lt;P&gt;Is there a version of springml spark-sftp that works with spark 3.x and scala 2.12?&amp;nbsp; If so, can you point me to it or tell me how to load it on my compute?&lt;/P&gt;</description>
    <pubDate>Thu, 24 Apr 2025 03:35:49 GMT</pubDate>
    <dc:creator>Unimog</dc:creator>
    <dc:date>2025-04-24T03:35:49Z</dc:date>
    <item>
      <title>springml sftp with spark 3.x</title>
      <link>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116420#M45309</link>
      <description>&lt;P&gt;Is there a version of springml spark-sftp that works with spark 3.x and scala 2.12?&amp;nbsp; If so, can you point me to it or tell me how to load it on my compute?&lt;/P&gt;</description>
      <pubDate>Thu, 24 Apr 2025 03:35:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116420#M45309</guid>
      <dc:creator>Unimog</dc:creator>
      <dc:date>2025-04-24T03:35:49Z</dc:date>
    </item>
    <item>
      <title>Re: springml sftp with spark 3.x</title>
      <link>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116507#M45330</link>
      <description>&lt;P class="_1t7bu9h1 paragraph"&gt;The SpringML Spark-SFTP library does not natively support Apache Spark 3.x and Scala 2.12. The library has not been actively maintained, with the last documented commit made in April 2019. This outdated state results in several issues:&lt;/P&gt;
&lt;OL&gt;
&lt;LI&gt;
&lt;P class="_1t7bu9h1 paragraph"&gt;&lt;STRONG&gt;Lack of Support for Spark 3.x&lt;/STRONG&gt;: It is acknowledged that the SpringML Spark-SFTP library is incompatible with Spark 3.x&lt;/P&gt;
&lt;/LI&gt;
&lt;LI&gt;
&lt;P class="_1t7bu9h1 paragraph"&gt;&lt;STRONG&gt;Incorrect Implementation&lt;/STRONG&gt;: The library is designed as a DataSource rather than as a Hadoop FileSystem, which affects the support for common formats like CSV, Parquet, and JSON in a Spark platform&lt;/P&gt;
&lt;/LI&gt;
&lt;LI&gt;
&lt;P class="_1t7bu9h1 paragraph"&gt;&lt;STRONG&gt;Unsupported File System Schemes&lt;/STRONG&gt;: The library only supports the &lt;CODE&gt;hdfs://&lt;/CODE&gt; file system scheme, making it incompatible with the Databricks runtime&lt;/P&gt;
&lt;/LI&gt;
&lt;LI&gt;
&lt;P class="_1t7bu9h1 paragraph"&gt;&lt;STRONG&gt;No Further Maintenance&lt;/STRONG&gt;: The lack of recent updates from the maintainers makes this library an unreliable dependency for modern Spark and Scala environments&lt;/P&gt;
&lt;/LI&gt;
&lt;/OL&gt;
&lt;P class="_1t7bu9h1 paragraph"&gt;Hope this helps, Louis.&lt;/P&gt;</description>
      <pubDate>Thu, 24 Apr 2025 18:02:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116507#M45330</guid>
      <dc:creator>Louis_Frolio</dc:creator>
      <dc:date>2025-04-24T18:02:07Z</dc:date>
    </item>
    <item>
      <title>Re: springml sftp with spark 3.x</title>
      <link>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116509#M45332</link>
      <description>&lt;P&gt;Thanks!&amp;nbsp; Are there any alternatives you recommend for SFTP within Databricks?&lt;/P&gt;</description>
      <pubDate>Thu, 24 Apr 2025 18:24:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116509#M45332</guid>
      <dc:creator>Unimog</dc:creator>
      <dc:date>2025-04-24T18:24:02Z</dc:date>
    </item>
    <item>
      <title>Re: springml sftp with spark 3.x</title>
      <link>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116512#M45333</link>
      <description>&lt;P&gt;For Python, you might want to look at Paramiko; it seems like it might be an option.&amp;nbsp; You could also look at ETL tools like Airbyte, Rivery, CData, etc.&lt;/P&gt;</description>
      <pubDate>Thu, 24 Apr 2025 18:40:12 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/springml-sftp-with-spark-3-x/m-p/116512#M45333</guid>
      <dc:creator>Louis_Frolio</dc:creator>
      <dc:date>2025-04-24T18:40:12Z</dc:date>
    </item>
  </channel>
</rss>

