<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: data preprocessing in Discussions</title>
    <link>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766206#M94621</link>
    <description>Hi &lt;a href="https://community.jmp.com/t5/user/viewprofilepage/user-id/56938"&gt;@maryam_nourmand&lt;/a&gt;,&lt;BR /&gt;&lt;BR /&gt;Did you read my reply to one of your similar questions: &lt;A href="https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/761840/highlight/true#M93976" target="_blank"&gt;https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/761840/highlight/true#M93976&lt;/A&gt;?</description>
    <pubDate>Sun, 16 Jun 2024 23:12:10 GMT</pubDate>
    <dc:creator>Victor_G</dc:creator>
    <dc:date>2024-06-16T23:12:10Z</dc:date>
    <item>
      <title>data preprocessing</title>
      <link>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766194#M94619</link>
      <description>&lt;P&gt;Hello.&lt;BR /&gt;My question is: when we use nonparametric models in software, such as neural networks, SVM, Naive Bayes, etc., does the software scale our data by default, or should we scale our numeric data before using these models?&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 16 Jun 2024 21:40:22 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766194#M94619</guid>
      <dc:creator>maryam_nourmand</dc:creator>
      <dc:date>2024-06-16T21:40:22Z</dc:date>
    </item>
    <item>
      <title>Re: data preprocessing</title>
      <link>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766206#M94621</link>
      <description>Hi &lt;a href="https://community.jmp.com/t5/user/viewprofilepage/user-id/56938"&gt;@maryam_nourmand&lt;/a&gt;,&lt;BR /&gt;&lt;BR /&gt;Did you read my reply to one of your similar questions: &lt;A href="https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/761840/highlight/true#M93976" target="_blank"&gt;https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/761840/highlight/true#M93976&lt;/A&gt;?</description>
      <pubDate>Sun, 16 Jun 2024 23:12:10 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766206#M94621</guid>
      <dc:creator>Victor_G</dc:creator>
      <dc:date>2024-06-16T23:12:10Z</dc:date>
    </item>
    <item>
      <title>Re: data preprocessing</title>
      <link>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766249#M94626</link>
      <description>&lt;P&gt;Yes i read&lt;BR /&gt;but you mention about ((&lt;SPAN&gt;&amp;nbsp;SVM, KNN, Neural Networks, (linear &amp;amp; logistic) regression))&lt;BR /&gt;i actually want to know about other models&amp;nbsp;&lt;BR /&gt;boosted tree&lt;BR /&gt;bootstrap forest&lt;BR /&gt;decision tree&lt;BR /&gt;Naive bayes&lt;BR /&gt;&lt;BR /&gt;thanks&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 17 Jun 2024 07:23:44 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766249#M94626</guid>
      <dc:creator>maryam_nourmand</dc:creator>
      <dc:date>2024-06-17T07:23:44Z</dc:date>
    </item>
    <item>
      <title>Re: data preprocessing</title>
      <link>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766270#M94630</link>
      <description>&lt;P&gt;Ok, but in my (very long) answer, I did mention tree-based methods and Naive Bayes:&lt;/P&gt;
&lt;BLOCKQUOTE&gt;
&lt;P&gt;&lt;SPAN&gt;Tree-based models and probability-based algorithms like Naive Bayes may not require scaling.&lt;/SPAN&gt;&lt;/P&gt;
&lt;/BLOCKQUOTE&gt;
&lt;P&gt;&lt;SPAN&gt;Tree-based methods don't require scaling as they are not distance-based algorithms; the splits are done based on the order of the data and information generated by splitting at a certain threshold, but there are no influences of the individual values, ranges or distributions on the split results.&lt;BR /&gt;Naive Bayes is a probability-based algorithm; it calculates probabilities from the data's distribution and is invariant to the scale of the data.&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Some further resources:&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;&lt;A href="https://stats.stackexchange.com/questions/244507/what-algorithms-need-feature-scaling-beside-from-svm" target="_blank" rel="noopener"&gt;https://stats.stackexchange.com/questions/244507/what-algorithms-need-feature-scaling-beside-from-svm&lt;/A&gt;&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;&lt;A href="https://www.dataschool.io/comparing-supervised-learning-algorithms/" target="_blank" rel="noopener"&gt;https://www.dataschool.io/comparing-supervised-learning-algorithms/&lt;/A&gt;&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;&lt;A href="https://forecastegy.com/posts/do-decision-trees-need-feature-scaling-or-normalization/" target="_blank" rel="noopener"&gt;https://forecastegy.com/posts/do-decision-trees-need-feature-scaling-or-normalization/&lt;/A&gt;&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;Does this complementary response answer your question ?&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 17 Jun 2024 08:31:10 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766270#M94630</guid>
      <dc:creator>Victor_G</dc:creator>
      <dc:date>2024-06-17T08:31:10Z</dc:date>
    </item>
    <item>
      <title>Re: data preprocessing</title>
      <link>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766283#M94632</link>
      <description>&lt;P&gt;Thanks a lot&lt;/P&gt;</description>
      <pubDate>Mon, 17 Jun 2024 08:31:29 GMT</pubDate>
      <guid>https://community.jmp.com/t5/Discussions/data-preprocessing/m-p/766283#M94632</guid>
      <dc:creator>maryam_nourmand</dc:creator>
      <dc:date>2024-06-17T08:31:29Z</dc:date>
    </item>
  </channel>
</rss>

