<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: save the duplicates in SAS Programming</title>
    <link>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838689#M331606</link>
    <description>&lt;P&gt;Alternatively, a data step approach&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;data have dups;

   if _N_ = 1 then do;
      dcl hash h(dataset : 'have(obs = 0)');
      h.definekey(all : 'Y');
      h.definedone();
   end;

   set have;

   if h.add() = 0 then output have;
   else                output dups;

run;&lt;/CODE&gt;&lt;/PRE&gt;</description>
    <pubDate>Fri, 14 Oct 2022 17:57:40 GMT</pubDate>
    <dc:creator>PeterClemmensen</dc:creator>
    <dc:date>2022-10-14T17:57:40Z</dc:date>
    <item>
      <title>save the duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838683#M331602</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I have a dataset&lt;/P&gt;&lt;P&gt;ID&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;vin&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;zip&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;&lt;/P&gt;&lt;P&gt;11221&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;7896&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 43567&lt;/P&gt;&lt;P&gt;11221&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;7654&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;43567&lt;/P&gt;&lt;P&gt;13456&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;5433&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 41323&lt;/P&gt;&lt;P&gt;13456&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;5433&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 41323&lt;/P&gt;&lt;P&gt;16754&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 6432&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 51678&lt;/P&gt;&lt;P&gt;16754&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;6432&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;51678&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I want to remove the duplicates and want to save what I removed
in a separate dataset.&lt;/P&gt;&lt;P&gt;Removed_duplicates&lt;/P&gt;&lt;P&gt;ID&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;vin&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;zip&lt;/P&gt;&lt;P&gt;13456&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 5433&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;41323&lt;/P&gt;&lt;P&gt;16754&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 6432&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 51678&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;thanks in advance.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 14 Oct 2022 17:40:31 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838683#M331602</guid>
      <dc:creator>Smitha9</dc:creator>
      <dc:date>2022-10-14T17:40:31Z</dc:date>
    </item>
    <item>
      <title>Re: save the duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838687#M331605</link>
      <description>&lt;P&gt;Try this&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;data have;
input ID vin zip;
datalines;
11221 7896 43567
11221 7654 43567
13456 5433 41323
13456 5433 41323
16754 6432 51678
16754 6432 51678
;

proc sort data = have nodupkey dupout = dups;
   by _ALL_;
run;&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&lt;U&gt;&lt;STRONG&gt;Result:&lt;/STRONG&gt;&lt;/U&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;have

ID     vin   zip
11221  7654  43567
11221  7896  43567
13456  5433  41323
16754  6432  51678

dups

ID     vin   zip
13456  5433  41323
16754  6432  51678&lt;/PRE&gt;</description>
      <pubDate>Fri, 14 Oct 2022 17:54:25 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838687#M331605</guid>
      <dc:creator>PeterClemmensen</dc:creator>
      <dc:date>2022-10-14T17:54:25Z</dc:date>
    </item>
    <item>
      <title>Re: save the duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838689#M331606</link>
      <description>&lt;P&gt;Alternatively, a data step approach&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;data have dups;

   if _N_ = 1 then do;
      dcl hash h(dataset : 'have(obs = 0)');
      h.definekey(all : 'Y');
      h.definedone();
   end;

   set have;

   if h.add() = 0 then output have;
   else                output dups;

run;&lt;/CODE&gt;&lt;/PRE&gt;</description>
      <pubDate>Fri, 14 Oct 2022 17:57:40 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838689#M331606</guid>
      <dc:creator>PeterClemmensen</dc:creator>
      <dc:date>2022-10-14T17:57:40Z</dc:date>
    </item>
    <item>
      <title>Re: save the duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838690#M331607</link>
      <description>&lt;P&gt;Maybe this gets you started. Please note the DATA step code used to provide example data that we can test code against.&lt;/P&gt;
&lt;P&gt;This removes all records with duplicate values.&lt;/P&gt;
&lt;PRE&gt;data have;
   input ID vin zip ;
datalines;
11221 7896  43567
11221 7654 43567
13456 5433  41323
13456 5433  41323
16754  6432  51678
16754 6432 51678
;

proc sort data=have out=duplicates 
     uniqueout=Havesort nouniquekey ;
  by _all_;
run;&lt;/PRE&gt;
&lt;P&gt;The Havesort data set in the output contains the sorted unique ("not duplicated") records. The Duplicates set will have all of the records with duplicate values, not just one of each.&lt;/P&gt;
&lt;P&gt;This leaves one record from each group of duplicates in the Want set, with the remainder of the duplicates in the Dupes set:&lt;/P&gt;
&lt;PRE&gt;proc sort data=have out=want 
     dupout=dupes nodupkey ;
  by _all_;
run;&lt;/PRE&gt;
&lt;P&gt;If this doesn't do what you want then provide a clearer example as to what the set without duplicates should look like.&lt;/P&gt;</description>
      <pubDate>Fri, 14 Oct 2022 18:04:17 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/save-the-duplicates/m-p/838690#M331607</guid>
      <dc:creator>ballardw</dc:creator>
      <dc:date>2022-10-14T18:04:17Z</dc:date>
    </item>
  </channel>
</rss>

