<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Delete duplicates based on 3 variables with different priority in SAS Procedures</title>
    <link>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615057#M76934</link>
    <description>&lt;P&gt;I know there have been a lot of posts about ways to delete duplicates, but I can't find exactly what I am looking for.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I have a data set of phone numbers and I am trying to save all of the unique phone numbers for each ID. I want one row per phone number. If a phone number appears multiple times for one record, I want to keep the record with the most recent date.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Here's an example of test data:&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;ID&amp;nbsp; &amp;nbsp; phone number&amp;nbsp; &amp;nbsp; &amp;nbsp; date&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp;(555) 555-5555&amp;nbsp; &amp;nbsp; &amp;nbsp;5/6/2018&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp;(555) 555-5555&amp;nbsp; &amp;nbsp; &amp;nbsp;6/8/2018&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp;(666) 666-6666&amp;nbsp; &amp;nbsp; &amp;nbsp;9/10/2018&lt;BR /&gt;2&amp;nbsp; &amp;nbsp; &amp;nbsp;(777) 777-7777&amp;nbsp; &amp;nbsp; &amp;nbsp;4/1/2018&lt;BR /&gt;2&amp;nbsp; &amp;nbsp; &amp;nbsp;(777) 777-7777&amp;nbsp; &amp;nbsp; &amp;nbsp;5/20/2018&lt;BR /&gt;3&amp;nbsp; &amp;nbsp; &amp;nbsp;(888) 888-8888&amp;nbsp; &amp;nbsp; &amp;nbsp;6/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;5/6/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;6/5/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(333) 333-3333&amp;nbsp; &amp;nbsp; &amp;nbsp;8/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;10/10/2018&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I would like the resulting data set to look like this:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;ID&amp;nbsp; &amp;nbsp; &amp;nbsp;phone number&amp;nbsp; &amp;nbsp; &amp;nbsp; date&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp; (555) 555-5555&amp;nbsp; &amp;nbsp; &amp;nbsp;6/8/2018&lt;BR 
/&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp; (666) 666-6666&amp;nbsp; &amp;nbsp; &amp;nbsp;9/10/2018&lt;BR /&gt;2&amp;nbsp; &amp;nbsp; &amp;nbsp; (777) 777-7777&amp;nbsp; &amp;nbsp; &amp;nbsp;5/20/2018&lt;BR /&gt;3&amp;nbsp; &amp;nbsp; &amp;nbsp; (888) 888-8888&amp;nbsp; &amp;nbsp; &amp;nbsp;6/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp; (333) 333-3333&amp;nbsp; &amp;nbsp; &amp;nbsp;8/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp; (222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;10/10/2018&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Where within one ID, each phone number only appears once. If the phone number appears for different dates in the original data, then the most recent date is the record that is kept.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks in advance for any help you can provide!&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Fri, 03 Jan 2020 20:15:19 GMT</pubDate>
    <dc:creator>katblack</dc:creator>
    <dc:date>2020-01-03T20:15:19Z</dc:date>
    <item>
      <title>Delete duplicates based on 3 variables with different priority</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615057#M76934</link>
      <description>&lt;P&gt;I know there have been a lot of posts about ways to delete duplicates, but I can't find exactly what I am looking for.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I have a data set of phone numbers and I am trying to save all of the unique phone numbers for each ID. I want one row per phone number. If a phone number appears multiple times for one record, I want to keep the record with the most recent date.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Here's an example of test data:&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;ID&amp;nbsp; &amp;nbsp; phone number&amp;nbsp; &amp;nbsp; &amp;nbsp; date&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp;(555) 555-5555&amp;nbsp; &amp;nbsp; &amp;nbsp;5/6/2018&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp;(555) 555-5555&amp;nbsp; &amp;nbsp; &amp;nbsp;6/8/2018&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp;(666) 666-6666&amp;nbsp; &amp;nbsp; &amp;nbsp;9/10/2018&lt;BR /&gt;2&amp;nbsp; &amp;nbsp; &amp;nbsp;(777) 777-7777&amp;nbsp; &amp;nbsp; &amp;nbsp;4/1/2018&lt;BR /&gt;2&amp;nbsp; &amp;nbsp; &amp;nbsp;(777) 777-7777&amp;nbsp; &amp;nbsp; &amp;nbsp;5/20/2018&lt;BR /&gt;3&amp;nbsp; &amp;nbsp; &amp;nbsp;(888) 888-8888&amp;nbsp; &amp;nbsp; &amp;nbsp;6/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;5/6/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;6/5/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(333) 333-3333&amp;nbsp; &amp;nbsp; &amp;nbsp;8/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp;(222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;10/10/2018&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I would like the resulting data set to look like this:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;ID&amp;nbsp; &amp;nbsp; &amp;nbsp;phone number&amp;nbsp; &amp;nbsp; &amp;nbsp; date&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp; (555) 555-5555&amp;nbsp; &amp;nbsp; 
&amp;nbsp;6/8/2018&lt;BR /&gt;1&amp;nbsp; &amp;nbsp; &amp;nbsp; (666) 666-6666&amp;nbsp; &amp;nbsp; &amp;nbsp;9/10/2018&lt;BR /&gt;2&amp;nbsp; &amp;nbsp; &amp;nbsp; (777) 777-7777&amp;nbsp; &amp;nbsp; &amp;nbsp;5/20/2018&lt;BR /&gt;3&amp;nbsp; &amp;nbsp; &amp;nbsp; (888) 888-8888&amp;nbsp; &amp;nbsp; &amp;nbsp;6/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp; (333) 333-3333&amp;nbsp; &amp;nbsp; &amp;nbsp;8/4/2018&lt;BR /&gt;4&amp;nbsp; &amp;nbsp; &amp;nbsp; (222) 222-2222&amp;nbsp; &amp;nbsp; &amp;nbsp;10/10/2018&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Where within one ID, each phone number only appears once. If the phone number appears for different dates in the original data, then the most recent date is the record that is kept.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks in advance for any help you can provide!&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 03 Jan 2020 20:15:19 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615057#M76934</guid>
      <dc:creator>katblack</dc:creator>
      <dc:date>2020-01-03T20:15:19Z</dc:date>
    </item>
    <item>
      <title>Re: Delete duplicates based on 3 variables with different priority</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615087#M76935</link>
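      <description>&lt;P&gt;This approach requires that date be stored as a real (numeric) SAS date, and not just a character string; otherwise the sort orders the values as text rather than chronologically, and the last record for each phone number may not be the most recent one:&lt;/P&gt;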
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;proc sort data=have;
  by id phone_number date;
run;

data want;
   set have;
   by id phone_number date;
   if last.phone_number;
run;&lt;/CODE&gt;&lt;/PRE&gt;</description>
      <pubDate>Fri, 03 Jan 2020 21:55:29 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615087#M76935</guid>
      <dc:creator>Astounding</dc:creator>
      <dc:date>2020-01-03T21:55:29Z</dc:date>
    </item>
    <item>
      <title>Re: Delete duplicates based on 3 variables with different priority</title>
      <link>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615135#M76939</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/157279"&gt;@katblack&lt;/a&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
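&lt;P&gt;Another approach, which also assumes that date is a numeric SAS date (so that max() returns the latest date and the MMDDYY10. format can be applied), could be:&lt;/P&gt;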
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;proc sql;
	create table want as
	select ID, phone_number, max(date) as date format=MMDDYY10.
	from have
	group by ID, phone_number;
quit;&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="Capture d’écran 2020-01-04 à 14.30.18.png" style="width: 200px;"&gt;&lt;img src="https://communities.sas.com/t5/image/serverpage/image-id/35140i0EEB890EF458E9F9/image-size/small?v=v2&amp;amp;px=200" role="button" title="Capture d’écran 2020-01-04 à 14.30.18.png" alt="Capture d’écran 2020-01-04 à 14.30.18.png" /&gt;&lt;/span&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 04 Jan 2020 13:31:26 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Procedures/Delete-duplicates-based-on-3-variables-with-different-priority/m-p/615135#M76939</guid>
      <dc:creator>ed_sas_member</dc:creator>
      <dc:date>2020-01-04T13:31:26Z</dc:date>
    </item>
  </channel>
</rss>

