<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Cut dataset in Discussions</title>
    <link>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409513#M65926</link>
    <description>&lt;P&gt;Hello,&lt;BR /&gt;I would like to split my dataset 70% vs 30% to have a learning dataset and a test dataset for my statistical models.&lt;BR /&gt;I use this method:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Emma1_0-1628866834288.png" style="width: 400px;"&gt;&lt;img src="https://community.jmp.com/t5/image/serverpage/image-id/35000i228BDF94EFCFEDD1/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Emma1_0-1628866834288.png" alt="Emma1_0-1628866834288.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Then I change the 0.7 to 0.3 to get the 30%.&lt;BR /&gt;However, when I do that, the dataset is not separated into two parts (70% vs 30%); it takes 70% and then 30%.&lt;BR /&gt;This means that the 30% dataset may contain data that is also in the 70% dataset.&lt;/P&gt;&lt;P&gt;Is there a way to split the dataset into two parts, 70% vs 30%, without having the same data in both parts?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;Thank you&lt;/P&gt;</description>
    <pubDate>Sat, 10 Jun 2023 23:35:26 GMT</pubDate>
    <dc:creator>Emma1</dc:creator>
    <dc:date>2023-06-10T23:35:26Z</dc:date>
    <item>
      <title>Cut dataset</title>
      <link>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409513#M65926</link>
      <description>&lt;P&gt;Hello,&lt;BR /&gt;I would like to split my dataset 70% vs 30% to have a learning dataset and a test dataset for my statistical models.&lt;BR /&gt;I use this method:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Emma1_0-1628866834288.png" style="width: 400px;"&gt;&lt;img src="https://community.jmp.com/t5/image/serverpage/image-id/35000i228BDF94EFCFEDD1/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Emma1_0-1628866834288.png" alt="Emma1_0-1628866834288.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Then I change the 0.7 to 0.3 to get the 30%.&lt;BR /&gt;However, when I do that, the dataset is not separated into two parts (70% vs 30%); it takes 70% and then 30%.&lt;BR /&gt;This means that the 30% dataset may contain data that is also in the 70% dataset.&lt;/P&gt;&lt;P&gt;Is there a way to split the dataset into two parts, 70% vs 30%, without having the same data in both parts?&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;Thank you&lt;/P&gt;</description>
      <pubDate>Sat, 10 Jun 2023 23:35:26 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409513#M65926</guid>
      <dc:creator>Emma1</dc:creator>
      <dc:date>2023-06-10T23:35:26Z</dc:date>
    </item>
    <item>
      <title>Re: Cut dataset</title>
      <link>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409520#M65927</link>
      <description>&lt;P&gt;You need to use the "Make Validation Column"&lt;/P&gt;
&lt;P&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp;Analyze=&amp;gt;Predictive Modeling=&amp;gt;Make Validation Column&lt;/P&gt;
&lt;P&gt;This will give you a new column that you can use, if you need to, to subset the data table into 2 different tables.&lt;/P&gt;</description>
      <pubDate>Fri, 13 Aug 2021 15:11:51 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409520#M65927</guid>
      <dc:creator>txnelson</dc:creator>
      <dc:date>2021-08-13T15:11:51Z</dc:date>
    </item>
    <item>
      <title>Re: Cut dataset</title>
      <link>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409645#M65937</link>
      <description>&lt;P&gt;Create a new column using the formula:&amp;nbsp;&lt;/P&gt;&lt;P&gt;Random Binomial(1, 0.3), it will give you 30% "1" and 70% "0".&lt;/P&gt;</description>
      <pubDate>Fri, 13 Aug 2021 21:21:07 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409645#M65937</guid>
      <dc:creator>ZF</dc:creator>
      <dc:date>2021-08-13T21:21:07Z</dc:date>
    </item>
    <item>
      <title>Re: Cut dataset</title>
      <link>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409934#M65967</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I use JMP version 16.1.0 and I can't find "Make Validation Column" in the "Analyze" menu.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Emma1_0-1629100101451.png" style="width: 400px;"&gt;&lt;img src="https://community.jmp.com/t5/image/serverpage/image-id/35044i326DDBBDAB425A38/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Emma1_0-1629100101451.png" alt="Emma1_0-1629100101451.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you&lt;/P&gt;</description>
      <pubDate>Mon, 16 Aug 2021 07:48:33 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409934#M65967</guid>
      <dc:creator>Emma1</dc:creator>
      <dc:date>2021-08-16T07:48:33Z</dc:date>
    </item>
    <item>
      <title>Re: Cut dataset</title>
      <link>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409935#M65968</link>
      <description>&lt;P&gt;It works very well !!&lt;/P&gt;&lt;P&gt;Thank you&lt;/P&gt;</description>
      <pubDate>Mon, 16 Aug 2021 07:49:13 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/Cut-dataset/m-p/409935#M65968</guid>
      <dc:creator>Emma1</dc:creator>
      <dc:date>2021-08-16T07:49:13Z</dc:date>
    </item>
  </channel>
</rss>

