<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Making all records in a spreadsheet unique and removing duplicates from other spreadsheets in SAS Programming</title>
    <link>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/777910#M247580</link>
    <description>&lt;P&gt;UNION in SQL checks for duplicates on its own:&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;proc sql;
create table new_dataset as
  select * from old_dataset
  union
  select * from update_dataset
;
quit;&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;Note that this involves an internal sort over all variables, so it can become very resource-intensive with larger data.&lt;/P&gt;
&lt;P&gt;OTOH, spreadsheets from Excel are not "large" as they max out at ~ 1 million rows.&lt;/P&gt;</description>
    <pubDate>Tue, 02 Nov 2021 13:21:39 GMT</pubDate>
    <dc:creator>Kurt_Bremser</dc:creator>
    <dc:date>2021-11-02T13:21:39Z</dc:date>
    <item>
      <title>Making all records in a spreadsheet unique and removing duplicates from other spreadsheets</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/777903#M247577</link>
      <description>&lt;P&gt;Good Afternoon Everyone,&amp;nbsp;&lt;/P&gt;&lt;P&gt;My problem is as follows:&lt;/P&gt;&lt;P&gt;I have a workbook with no unique identifiers and data that appears to be duplicates but the client requested that the information be kept as is and that the information we see within the spreadsheet is not a duplicate.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I have assigned unique identifiers to the records using COUNT() but where the problem comes in is that when we receive new files from the client, the new files could have the exact same information as the previous workbook with one or two new records. How do I keep only the new records from the new file so that I can append it to my existing dataset and remove the duplicates from the new data because they are duplicates from the previous workbook and I do not want that in my dataset while still assigning my unique identifiers to the records.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Please find attached an example of what the Spreadsheet looks like:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;So I want to keep both instances of handy inc and assign unique identifiers for both records.&amp;nbsp;&lt;/P&gt;&lt;P&gt;But if these same records appear in a newly sent spreadsheet by a client that those rows be excluded and only the new records be kept for appending.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you in advance for all assistance provided&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Comm Example.PNG" style="width: 613px;"&gt;&lt;img src="https://communities.sas.com/t5/image/serverpage/image-id/65311iAF92113F5C97A086/image-size/large?v=v2&amp;amp;px=999" role="button" title="Comm Example.PNG" alt="Comm Example.PNG" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 02 Nov 2021 13:10:41 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/777903#M247577</guid>
      <dc:creator>Ricardo96</dc:creator>
      <dc:date>2021-11-02T13:10:41Z</dc:date>
    </item>
    <item>
      <title>Re: Making all records in a spreadsheet unique and removing duplicates from other spreadsheets</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/777910#M247580</link>
      <description>&lt;P&gt;UNION in SQL checks for duplicates on its own:&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;proc sql;
create table new_dataset as
  select * from old_dataset
  union
  select * from update_dataset
;
quit;&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;Note that this involves an internal sort over all variables, so it can become very resource-intensive with larger data.&lt;/P&gt;
&lt;P&gt;OTOH, spreadsheets from Excel are not "large" as they max out at ~ 1 million rows.&lt;/P&gt;</description>
      <pubDate>Tue, 02 Nov 2021 13:21:39 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/777910#M247580</guid>
      <dc:creator>Kurt_Bremser</dc:creator>
      <dc:date>2021-11-02T13:21:39Z</dc:date>
    </item>
    <item>
      <title>Re: Making all records in a spreadsheet unique and removing duplicates from other spreadsheets</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/778241#M247715</link>
      <description>&lt;P&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/11562"&gt;@Kurt_Bremser&lt;/a&gt;&amp;nbsp;Thank you.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 03 Nov 2021 15:55:23 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/778241#M247715</guid>
      <dc:creator>Ricardo96</dc:creator>
      <dc:date>2021-11-03T15:55:23Z</dc:date>
    </item>
    <item>
      <title>Re: Making all records in a spreadsheet unique and removing duplicates from other spreadsheets</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/820882#M324048</link>
      <description>&lt;P&gt;Thank you very much for the assistance on this problem...huge help.&amp;nbsp;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 29 Jun 2022 10:01:34 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Making-all-records-in-a-spreadsheet-unique-and-removing/m-p/820882#M324048</guid>
      <dc:creator>Ricardo96</dc:creator>
      <dc:date>2022-06-29T10:01:34Z</dc:date>
    </item>
  </channel>
</rss>

