<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Oversampling in Enterprise Miner with a rare event fixed proportion in SAS Data Science</title>
    <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161994#M1755</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Fabio&lt;/P&gt;&lt;P&gt;I am not sure if it will be of some help, but you may take a look at this paper:&lt;/P&gt;&lt;P&gt;&lt;A class="active_link" href="http://gking.harvard.edu/files/0s.pdf" title="http://gking.harvard.edu/files/0s.pdf"&gt;http://gking.harvard.edu/files/0s.pdf&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The authors study the opposite of the problem you are trying to solve. They suggest an adjustment procedure for data sets with a huge number of observations but relatively few events. Nevertheless, you may be able to implement the same sampling design principle in your data set and estimation procedure as the authors suggest. I have used their methodology for large data sets with a relatively low number of cases, and it is quite an effective and slick approach.&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/P&gt;&lt;P&gt;Good luck.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Thu, 02 Oct 2014 13:47:05 GMT</pubDate>
    <dc:creator>jsienna</dc:creator>
    <dc:date>2014-10-02T13:47:05Z</dc:date>
    <item>
      <title>Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161991#M1752</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I need to oversample in Enterprise Miner with a rare event fixed proportion.&lt;/P&gt;&lt;P&gt;Starting from a database with 0.5% rare events, I need to specify the proportion of rare events in the sample. 50:50 is not ok, because the database is too small in this case.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thank you very much.&lt;/P&gt;&lt;P&gt;F&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Fri, 26 Sep 2014 16:32:34 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161991#M1752</guid>
      <dc:creator>Fabio</dc:creator>
      <dc:date>2014-09-26T16:32:34Z</dc:date>
    </item>
    <item>
      <title>Re: Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161992#M1753</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi Fabio,&lt;/P&gt;&lt;P&gt;This usage note details the steps on how to model a rare event using oversampling.&lt;/P&gt;&lt;P&gt;Link here: &lt;A href="http://support.sas.com/kb/24/205.html" title="http://support.sas.com/kb/24/205.html"&gt;24205 - Rare event oversampling for model fitting in SAS® Enterprise Miner(tm)&lt;/A&gt;&lt;/P&gt;&lt;P&gt;It includes a video too!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Miguel&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 29 Sep 2014 15:10:29 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161992#M1753</guid>
      <dc:creator>M_Maldonado</dc:creator>
      <dc:date>2014-09-29T15:10:29Z</dc:date>
    </item>
    <item>
      <title>Re: Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161993#M1754</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Thank you, Miguel.&lt;/P&gt;&lt;P&gt;The note helps to create a 50-50 sample. But the proportion of rare events is too big for me in this sample. I need a sample with a 10% rare event proportion.&lt;/P&gt;&lt;P&gt;Is it possible?&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Oct 2014 07:50:28 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161993#M1754</guid>
      <dc:creator>Fabio</dc:creator>
      <dc:date>2014-10-02T07:50:28Z</dc:date>
    </item>
    <item>
      <title>Re: Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161994#M1755</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Fabio&lt;/P&gt;&lt;P&gt;I am not sure if it will be of some help, but you may take a look at this paper:&lt;/P&gt;&lt;P&gt;&lt;A class="active_link" href="http://gking.harvard.edu/files/0s.pdf" title="http://gking.harvard.edu/files/0s.pdf"&gt;http://gking.harvard.edu/files/0s.pdf&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;The authors study the opposite of the problem you are trying to solve. They suggest an adjustment procedure for data sets with a huge number of observations but relatively few events. Nevertheless, you may be able to implement the same sampling design principle in your data set and estimation procedure as the authors suggest. I have used their methodology for large data sets with a relatively low number of cases, and it is quite an effective and slick approach.&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/P&gt;&lt;P&gt;Good luck.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Oct 2014 13:47:05 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161994#M1755</guid>
      <dc:creator>jsienna</dc:creator>
      <dc:date>2014-10-02T13:47:05Z</dc:date>
    </item>
    <item>
      <title>Re: Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161995#M1756</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Fabio, use the "Level Based" options in the Sampling node as demonstrated in the video that Miguel mentioned. You can set any sampling proportions that you want.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Also see the section on "Detecting Rare Classes" in the documentation for Enterprise Miner.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Oct 2014 16:49:14 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161995#M1756</guid>
      <dc:creator>WarrenSarle</dc:creator>
      <dc:date>2014-10-02T16:49:14Z</dc:date>
    </item>
    <item>
      <title>Re: Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161996#M1757</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Thank you everybody for your precious help&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Fri, 03 Oct 2014 15:49:26 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161996#M1757</guid>
      <dc:creator>Fabio</dc:creator>
      <dc:date>2014-10-03T15:49:26Z</dc:date>
    </item>
    <item>
      <title>Re: Oversampling in Enterprise Miner with a rare event fixed proportion</title>
      <link>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161997#M1758</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Fabio,&lt;/P&gt;&lt;P&gt;I added a detailed example this morning on how to adjust probabilities for a 50/50 oversample using a Decisions node.&lt;/P&gt;&lt;P&gt;Take a look here:&lt;A __default_attr="231401" __jive_macro_name="message" class="jive_macro jive_macro_message" href="https://communities.sas.com/"&gt;&lt;/A&gt;.&lt;/P&gt;&lt;P&gt;I hope it helps,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Miguel&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Fri, 03 Oct 2014 17:48:42 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Data-Science/Oversampling-in-Enterprise-Miner-with-a-rare-event-fixed/m-p/161997#M1758</guid>
      <dc:creator>M_Maldonado</dc:creator>
      <dc:date>2014-10-03T17:48:42Z</dc:date>
    </item>
  </channel>
</rss>

