<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Finding Duplicates in SAS Programming</title>
    <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135919#M295747</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;If you have Data Flux Tool you can do it very easily. you need to run the DF job with proper QKB attached with it.&lt;/P&gt;&lt;P&gt;It will generate same ID for duplicate records.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Let me know if you want if you want more elaboration.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;Pravin&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Mon, 04 Aug 2014 17:35:16 GMT</pubDate>
    <dc:creator>PravinMishra</dc:creator>
    <dc:date>2014-08-04T17:35:16Z</dc:date>
    <item>
      <title>Finding Duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135914#M295742</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;I am trying to find duplicates in one column that have different values in another.&amp;nbsp; For example, different sender names with the same sender address.&amp;nbsp; I am using EG and I am not sure which option would be the best. &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;For example:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN style="text-decoration: underline;"&gt;&lt;SPAN style="color: #575757; text-decoration: underline;"&gt;Sender Name&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/SPAN&gt;&lt;SPAN style="color: #575757; text-decoration: underline;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Sender Address&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN style="color: #575757;"&gt;John Doe&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 123 Main St.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN style="color: #575757;"&gt;Jane Doe&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 123 Main St.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN style="color: #575757;"&gt;Thanks for the help!&lt;/SPAN&gt;&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 28 Apr 2014 14:34:48 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135914#M295742</guid>
      <dc:creator>PRudnick</dc:creator>
      <dc:date>2014-04-28T14:34:48Z</dc:date>
    </item>
    <item>
      <title>Re: Finding Duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135915#M295743</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Can you use proc freq on the data?&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 28 Apr 2014 14:41:30 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135915#M295743</guid>
      <dc:creator>RW9</dc:creator>
      <dc:date>2014-04-28T14:41:30Z</dc:date>
    </item>
    <item>
      <title>Re: Finding Duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135916#M295744</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;if you don't mind putting down some SAS code, and assuming name and address are all you have, then try the following:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;proc sql;&lt;/P&gt;&lt;P&gt;&amp;nbsp; create table want/*this is your output table*/ as&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; select * from have /*this is the input table*/&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; group by sender_address&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; having count(*) &amp;gt;1&lt;/P&gt;&lt;P&gt;;quit;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Or like &lt;A __default_attr="814511" __jive_macro_name="user" class="jive_macro jive_macro_user" data-objecttype="3" href="https://communities.sas.com/"&gt;&lt;/A&gt; suggested, try using proc freq. In EG, you will find it under the task name called&amp;nbsp; "One-Way Frequencies".&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Haikuo &lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 28 Apr 2014 14:52:44 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135916#M295744</guid>
      <dc:creator>Haikuo</dc:creator>
      <dc:date>2014-04-28T14:52:44Z</dc:date>
    </item>
    <item>
      <title>Re: Finding Duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135917#M295745</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;There is a lot of data involved....&amp;nbsp; I have 49 different columns.&amp;nbsp; Proc freq will show me how many times an address is used but I want to be able to output the instance where different Senders are using the same address&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 28 Apr 2014 15:31:42 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135917#M295745</guid>
      <dc:creator>PRudnick</dc:creator>
      <dc:date>2014-04-28T15:31:42Z</dc:date>
    </item>
    <item>
      <title>Re: Finding Duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135918#M295746</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;You could try using query builder , and/or one-way frequencies, or just run the code that I posted with a minor weak:&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;proc sql;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp; create table want/*this is your output table*/ as&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp; select * from have /*this is the input table*/&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp; group by sender_address&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp; having count(distinct sender_name) &amp;gt;1&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;;quit;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;This will give you all the addresses that have more than one different names.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Haikuo&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Update: not that I am not aware you are EG user, but to post numerous screen shots is just too much for me. &lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 28 Apr 2014 16:00:30 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135918#M295746</guid>
      <dc:creator>Haikuo</dc:creator>
      <dc:date>2014-04-28T16:00:30Z</dc:date>
    </item>
    <item>
      <title>Re: Finding Duplicates</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135919#M295747</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;If you have Data Flux Tool you can do it very easily. you need to run the DF job with proper QKB attached with it.&lt;/P&gt;&lt;P&gt;It will generate same ID for duplicate records.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Let me know if you want if you want more elaboration.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;Pravin&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 04 Aug 2014 17:35:16 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Finding-Duplicates/m-p/135919#M295747</guid>
      <dc:creator>PravinMishra</dc:creator>
      <dc:date>2014-08-04T17:35:16Z</dc:date>
    </item>
  </channel>
</rss>

