<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic How to I select an 80/10/10 split when doing AutoML in Machine Learning</title>
    <link>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70277#M3278</link>
    <description>&lt;P&gt;Headline says it all. I am doing a regression and want to select a testvaltrain split that is not 60/20/20. Anyone know how to do this?&lt;/P&gt;</description>
    <pubDate>Wed, 22 May 2024 15:31:17 GMT</pubDate>
    <dc:creator>bothma2</dc:creator>
    <dc:date>2024-05-22T15:31:17Z</dc:date>
    <item>
      <title>How to I select an 80/10/10 split when doing AutoML</title>
      <link>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70277#M3278</link>
      <description>&lt;P&gt;Headline says it all. I am doing a regression and want to select a testvaltrain split that is not 60/20/20. Anyone know how to do this?&lt;/P&gt;</description>
      <pubDate>Wed, 22 May 2024 15:31:17 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70277#M3278</guid>
      <dc:creator>bothma2</dc:creator>
      <dc:date>2024-05-22T15:31:17Z</dc:date>
    </item>
    <item>
      <title>Re: How to I select an 80/10/10 split when doing AutoML</title>
      <link>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70295#M3279</link>
      <description>&lt;P&gt;You can't do it but there is a workaround:&lt;BR /&gt;&lt;BR /&gt;You could use a fake time column and force it to be 80/10/10.&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;BR /&gt;&lt;SPAN&gt;If you specify this column (in the advanced section - "Time column for training/validation/testing split"), the dataset is split into training, validation, and test sets by time. The earliest points are used for training, the next earliest for validation, and the latest points are used as a test set. Try using all the earliest points as the same timestamp, then another for validation and another one for testing.&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 22 May 2024 18:02:25 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70295#M3279</guid>
      <dc:creator>mhiltner</dc:creator>
      <dc:date>2024-05-22T18:02:25Z</dc:date>
    </item>
    <item>
      <title>Re: How to I select an 80/10/10 split when doing AutoML</title>
      <link>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70296#M3280</link>
      <description>&lt;P&gt;Wouldn;t that just do a 60/20/20 split?&lt;/P&gt;</description>
      <pubDate>Wed, 22 May 2024 18:06:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70296#M3280</guid>
      <dc:creator>bothma2</dc:creator>
      <dc:date>2024-05-22T18:06:46Z</dc:date>
    </item>
    <item>
      <title>Re: How to I select an 80/10/10 split when doing AutoML</title>
      <link>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70318#M3281</link>
      <description>&lt;P&gt;You'd need to put 80% of your data with the earliest timestamp, then 10% with another one and 10% with another.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 22 May 2024 20:46:52 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/how-to-i-select-an-80-10-10-split-when-doing-automl/m-p/70318#M3281</guid>
      <dc:creator>mhiltner</dc:creator>
      <dc:date>2024-05-22T20:46:52Z</dc:date>
    </item>
  </channel>
</rss>

