<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Big time differences in reading tables in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/big-time-differences-in-reading-tables/m-p/38380#M5501</link>
    <description>&lt;P&gt;When I read managed table in #databricks# i can see big differences in time spent. Small test table with just 2 records is once loaded in 3 seconds and another time in 30 seconds. Reading table_change for this tinny table took 15 minutes. Don't know if this has any explanation or cluster setting is somehow wrong.&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;storage: ADLS gen2&lt;/LI&gt;&lt;LI&gt;cluster config:&lt;UL&gt;&lt;LI&gt;access mode: shared&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;runtime: 13.2 (includes Apache Spark 3.4.0, Scala 2.12)&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;worker: Standard_DS_v2 14GB, 4 Cores min 2 max 8&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;driver:&amp;nbsp;Standard_DS_v2 &lt;/SPAN&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;enable autoscaling = true&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;No other advanced options&lt;/SPAN&gt;&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;SPAN&gt;Thanks.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Tue, 25 Jul 2023 13:06:16 GMT</pubDate>
    <dc:creator>alesventus</dc:creator>
    <dc:date>2023-07-25T13:06:16Z</dc:date>
    <item>
      <title>Big time differences in reading tables</title>
      <link>https://community.databricks.com/t5/get-started-discussions/big-time-differences-in-reading-tables/m-p/38380#M5501</link>
      <description>&lt;P&gt;When I read managed table in #databricks# i can see big differences in time spent. Small test table with just 2 records is once loaded in 3 seconds and another time in 30 seconds. Reading table_change for this tinny table took 15 minutes. Don't know if this has any explanation or cluster setting is somehow wrong.&lt;/P&gt;&lt;OL&gt;&lt;LI&gt;storage: ADLS gen2&lt;/LI&gt;&lt;LI&gt;cluster config:&lt;UL&gt;&lt;LI&gt;access mode: shared&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;runtime: 13.2 (includes Apache Spark 3.4.0, Scala 2.12)&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;worker: Standard_DS_v2 14GB, 4 Cores min 2 max 8&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;driver:&amp;nbsp;Standard_DS_v2 &lt;/SPAN&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;enable autoscaling = true&lt;/SPAN&gt;&lt;/LI&gt;&lt;LI&gt;&lt;SPAN&gt;No other advanced options&lt;/SPAN&gt;&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;&lt;SPAN&gt;Thanks.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 25 Jul 2023 13:06:16 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/big-time-differences-in-reading-tables/m-p/38380#M5501</guid>
      <dc:creator>alesventus</dc:creator>
      <dc:date>2023-07-25T13:06:16Z</dc:date>
    </item>
  </channel>
</rss>

