<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Seeing if two strings are "similar" enough in SAS Programming</title>
    <link>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481739#M124674</link>
    <description>&lt;P&gt;Have a look at the &lt;A href="http://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002206133.htm" target="_self"&gt;COMPGED&lt;/A&gt; and &lt;A href="http://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002206137.htm" target="_self"&gt;COMPLEV&lt;/A&gt; functions; they are good places to start.&lt;/P&gt;</description>
    <pubDate>Fri, 27 Jul 2018 01:11:53 GMT</pubDate>
    <dc:creator>PeterClemmensen</dc:creator>
    <dc:date>2018-07-27T01:11:53Z</dc:date>
    <item>
      <title>Seeing if two strings are "similar" enough</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481715#M124660</link>
      <description>&lt;P&gt;I have a column called "&lt;STRONG&gt;name&lt;/STRONG&gt;" where people manually inputted a lot of people's names.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am hoping to use SAS to look for duplicates, but there's a high chance of errors, e.g. a few typos, but a "normal human" would know that the two names are likely referring to the same person.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I was wondering what it might look like if I asked SAS to first sort names in alphabetical order, then for each entry, compare it with the strings&amp;nbsp;directly above and below it -- if either of those entries has the same number of characters +/- 2, and then the same letters but with 4 differences, then we will count that as a duplicate and then the new var&amp;nbsp;&lt;STRONG&gt;duplicate&lt;/STRONG&gt; = 1.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Not sure if people have ideas as to how I might compare strings this way?&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you!&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 26 Jul 2018 23:03:56 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481715#M124660</guid>
      <dc:creator>cdubs</dc:creator>
      <dc:date>2018-07-26T23:03:56Z</dc:date>
    </item>
    <item>
      <title>Re: Seeing if two strings are "similar" enough</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481718#M124661</link>
      <description>&lt;P&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/174079"&gt;@cdubs&lt;/a&gt;&lt;/P&gt;
&lt;P&gt;Similar questions like yours come up from time to time. Have you already searched this forum with terms like "fuzzy match"?&lt;/P&gt;
&lt;P&gt;You would find discussions like: &lt;A href="https://communities.sas.com/t5/Base-SAS-Programming/Fuzzy-match-with-soundex-and-compged/m-p/295334/highlight/true#M61710" target="_blank"&gt;https://communities.sas.com/t5/Base-SAS-Programming/Fuzzy-match-with-soundex-and-compged/m-p/295334/highlight/true#M61710&lt;/A&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 26 Jul 2018 23:08:37 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481718#M124661</guid>
      <dc:creator>Patrick</dc:creator>
      <dc:date>2018-07-26T23:08:37Z</dc:date>
    </item>
    <item>
      <title>Re: Seeing if two strings are "similar" enough</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481720#M124663</link>
      <description>&lt;P&gt;I haven't!&amp;nbsp;I'll look at those now &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 26 Jul 2018 23:09:32 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481720#M124663</guid>
      <dc:creator>cdubs</dc:creator>
      <dc:date>2018-07-26T23:09:32Z</dc:date>
    </item>
    <item>
      <title>Re: Seeing if two strings are "similar" enough</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481739#M124674</link>
      <description>&lt;P&gt;Have a look at the &lt;A href="http://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002206133.htm" target="_self"&gt;COMPGED&lt;/A&gt; and &lt;A href="http://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002206137.htm" target="_self"&gt;COMPLEV&lt;/A&gt; functions; they are good places to start.&lt;/P&gt;</description>
      <pubDate>Fri, 27 Jul 2018 01:11:53 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Seeing-if-two-strings-are-quot-similar-quot-enough/m-p/481739#M124674</guid>
      <dc:creator>PeterClemmensen</dc:creator>
      <dc:date>2018-07-27T01:11:53Z</dc:date>
    </item>
  </channel>
</rss>

