<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Variable Reduction for Clustering Model in SAS Data Science</title>
    <link>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179024#M2130</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi all,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Are there any other more advanced and robust ways in SAS Base besides Varclus or principal components that can be used for variable reduction?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I am trying to perform a cluster analysis with over a hundred variable so i was wondering if there is something out there that can help reduce the number of variables as well as providing me with the strongest discriminators for my data.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Kind regards&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Mon, 14 Apr 2014 13:35:37 GMT</pubDate>
    <dc:creator>chemicalab</dc:creator>
    <dc:date>2014-04-14T13:35:37Z</dc:date>
    <item>
      <title>Variable Reduction for Clustering Model</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179024#M2130</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi all,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Are there any other more advanced and robust ways in SAS Base besides Varclus or principal components that can be used for variable reduction?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I am trying to perform a cluster analysis with over a hundred variable so i was wondering if there is something out there that can help reduce the number of variables as well as providing me with the strongest discriminators for my data.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Kind regards&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 14 Apr 2014 13:35:37 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179024#M2130</guid>
      <dc:creator>chemicalab</dc:creator>
      <dc:date>2014-04-14T13:35:37Z</dc:date>
    </item>
    <item>
      <title>Re: Variable Reduction for Clustering Model</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179025#M2131</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Chemicalab,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Proc princomp and proc varclus are the go-to methods in Base SAS as you mention.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;A different approach if you have access to SAS Enterprise Miner: try calculating the variable importance using a tree-based model node. Then confirm the variable importance of your variables.&lt;BR /&gt;Please note that these nodes have the variable selection option set to Yes by default. This means that if you connect any of these nodes to a Cluster node, you will pass only the most important variables (relative variable importance greater or equal to 0.05). A few considerations below.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Decision Tree node - variable importance is calculated using only one decision tree.&lt;/LI&gt;&lt;LI&gt;HPForest node - variable importance is calculated using a random forest model, which is more robust. This node is available in SAS Enterprise Miner 12.3 or newer.&lt;/LI&gt;&lt;LI&gt;Gradient Boosting node - it is very robust, but the sequential nature of this algorithm makes it take some time to run.&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;&lt;BR /&gt;I hope it helps,&lt;BR /&gt;Thanks,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Miguel&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 14 Apr 2014 14:05:20 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179025#M2131</guid>
      <dc:creator>M_Maldonado</dc:creator>
      <dc:date>2014-04-14T14:05:20Z</dc:date>
    </item>
    <item>
      <title>Re: Variable Reduction for Clustering Model</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179026#M2132</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Unfortunately i dont have EM so i guess i will have to go with Proc Princ or Varclus, thank you for the reply&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 14 Apr 2014 14:16:37 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Variable-Reduction-for-Clustering-Model/m-p/179026#M2132</guid>
      <dc:creator>chemicalab</dc:creator>
      <dc:date>2014-04-14T14:16:37Z</dc:date>
    </item>
  </channel>
</rss>

