<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic sparklyr::spark_read_csv forbidden 403 error in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/sparklyr-spark-read-csv-forbidden-403-error/m-p/62756#M6668</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I am trying to read a csv file into a Spark DataFrame using sparklyr::spark_read_csv. I am receiving a 403 access denied error.&lt;/P&gt;&lt;P&gt;I have stored my AWS credentials as environment variables, and can successfully read the file as an R dataframe using&amp;nbsp;&lt;SPAN&gt;arrow::read_csv_arrow. However, spark_read_csv is failing.&lt;/SPAN&gt;&lt;/P&gt;&lt;DIV&gt;&amp;nbsp;&lt;DIV&gt;&lt;SPAN&gt;&lt;SPAN&gt;I have confirmed that I am connected to spark, and can read parquet files stored elsewhere.&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;DIV&gt;&amp;nbsp;&lt;DIV&gt;&lt;SPAN&gt;&lt;SPAN&gt;Any advice?&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;DIV&gt;&amp;nbsp;&lt;DIV&gt;&lt;SPAN&gt;&lt;SPAN&gt;Thanks,&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;P&gt;my_file &amp;lt;- glue::glue("s3://my-bucket/my-folder/my-file-name.csv")&lt;/P&gt;&lt;P&gt;## This works&lt;BR /&gt;mydata &amp;lt;- arrow::read_csv_arrow(&lt;BR /&gt;file = my_file&lt;BR /&gt;)&lt;BR /&gt;## This doesn't&lt;BR /&gt;mydata &amp;lt;- sparklyr::spark_read_csv(&lt;BR /&gt;sc,&lt;BR /&gt;name = "mydata",&lt;BR /&gt;file = my_file&lt;BR /&gt;)&lt;/P&gt;&lt;P&gt;# Error message&lt;BR /&gt;Error : java.nio.file.AccessDeniedException&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Caused by: com.amazonaws.services.s3.model.AmazonS3Exception: Forbidden; request&lt;/SPAN&gt;&lt;/P&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
    <pubDate>Wed, 06 Mar 2024 15:12:52 GMT</pubDate>
    <dc:creator>thethirtyfour</dc:creator>
    <dc:date>2024-03-06T15:12:52Z</dc:date>
    <item>
      <title>sparklyr::spark_read_csv forbidden 403 error</title>
      <link>https://community.databricks.com/t5/get-started-discussions/sparklyr-spark-read-csv-forbidden-403-error/m-p/62756#M6668</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I am trying to read a csv file into a Spark DataFrame using sparklyr::spark_read_csv. I am receiving a 403 access denied error.&lt;/P&gt;&lt;P&gt;I have stored my AWS credentials as environment variables, and can successfully read the file as an R dataframe using&amp;nbsp;&lt;SPAN&gt;arrow::read_csv_arrow. However, spark_read_csv is failing.&lt;/SPAN&gt;&lt;/P&gt;&lt;DIV&gt;&amp;nbsp;&lt;DIV&gt;&lt;SPAN&gt;&lt;SPAN&gt;I have confirmed that I am connected to spark, and can read parquet files stored elsewhere.&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;DIV&gt;&amp;nbsp;&lt;DIV&gt;&lt;SPAN&gt;&lt;SPAN&gt;Any advice?&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;DIV&gt;&amp;nbsp;&lt;DIV&gt;&lt;SPAN&gt;&lt;SPAN&gt;Thanks,&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;P&gt;my_file &amp;lt;- glue::glue("s3://my-bucket/my-folder/my-file-name.csv")&lt;/P&gt;&lt;P&gt;## This works&lt;BR /&gt;mydata &amp;lt;- arrow::read_csv_arrow(&lt;BR /&gt;file = my_file&lt;BR /&gt;)&lt;BR /&gt;## This doesn't&lt;BR /&gt;mydata &amp;lt;- sparklyr::spark_read_csv(&lt;BR /&gt;sc,&lt;BR /&gt;name = "mydata",&lt;BR /&gt;file = my_file&lt;BR /&gt;)&lt;/P&gt;&lt;P&gt;# Error message&lt;BR /&gt;Error : java.nio.file.AccessDeniedException&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Caused by: com.amazonaws.services.s3.model.AmazonS3Exception: Forbidden; request&lt;/SPAN&gt;&lt;/P&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
      <pubDate>Wed, 06 Mar 2024 15:12:52 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/sparklyr-spark-read-csv-forbidden-403-error/m-p/62756#M6668</guid>
      <dc:creator>thethirtyfour</dc:creator>
      <dc:date>2024-03-06T15:12:52Z</dc:date>
    </item>
  </channel>
</rss>

