<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Matching the String Variables in SAS Programming</title>
    <link>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625006#M184184</link>
    <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/11763"&gt;@AbuChowdhury&lt;/a&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Here is one approach to do this.&lt;/P&gt;
&lt;P&gt;Hope this helps!&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;data one;
	/* Reference table: one Rank per Name and Year.                        */
	/* Fields are tab-delimited ("09"x), so a Name containing blanks is    */
	/* read as a single value.                                             */
	infile datalines dlm="09"x;
	/* The colon modifier reads Name up to the next delimiter (max 50 chars). */
	input Name:$50. Rank  Year;
	datalines;
A.S. Goldmen	2.01	2002
A.S. Goldmen	3.01	2003
AG Edwards	2.51	2001
AG Edwards	2.61	2002
Credit Suisse	3.50	2002
;

data two;
	/* Table to be matched against ONE. A Name here may be a single unit,  */
	/* a variant spelling ("Goldmen (xxx)"), or several units concatenated */
	/* without any separator. Fields are tab-delimited ("09"x).            */
	infile datalines dlm="09"x;
	input Name:$50. Year;
	datalines;
A.S. Goldmen	2002
Goldmen (xxx)	2003
AG Edwards	2001
AG Edwards	2002  
A.S. GoldmenAG Edwards	2002
Credit Suisse	2002
A.S. GoldmenAG EdwardsCredit Suisse	2002
; 

/* Build two macro variables from the distinct names in ONE:
     units       - comma-separated list of single-quoted names in which "."
                   and blanks have been rewritten as the regex tokens \. and \s
     total_units - the number of distinct names
   NOTE(review): only "." and blanks are escaped; a name containing other
   regex metacharacters (parentheses, +, ?, ...) would need extra handling. */
proc sql noprint;
	select distinct
		quote(tranwrd(tranwrd(strip(Name), '.', '\.'), ' ', '\s'), "'")
		into :units separated by ","
		from one;
	select count(distinct name)
		into :total_units
		from one;
quit;

/* Split each Name of TWO into the known units it contains, one unit per
   _name variable. The units and total_units macro variables are expected to
   have been created by the PROC SQL step that precedes this one. */
data two2;
	set two;
	if Name="Goldmen (xxx)" then Name="A.S. Goldmen"; /* Data management: map the variant spelling */
	id+1; /* running row counter, used as a BY key by the later sort/transpose */
	array _name(&amp;amp;total_units) $ 50;
	array _unit(&amp;amp;total_units) $ 50 _temporary_ (&amp;amp;units);
	do i=1 to &amp;amp;total_units;
		/* The test and the extraction use the same case-sensitive pattern, so
		   the captured text is exactly the occurrence that was tested and can
		   be joined on equality with ONE.Name. The pattern is anchored on the
		   whole value, hence a single replacement (times=1) is sufficient. */
		if prxmatch(cats('/^.*(',_unit(i),').*$/'),Name) then
			_name(i)=prxchange(cats('s/^.*(',_unit(i),').*$/$1/'),1,Name);
	end;
	drop i;
run;

/* Reshape TWO2 to long form: one row per id, name, year and non-blank unit */
proc sort data=two2;
	by id name year;
run;

proc transpose
		data=two2
		out=two2_tr (rename=(col1=unit) where=(unit ne "") drop=_name_);
	by id name year;
	var _name:;
run;

/* Attach to every extracted unit its rank for the same year */
proc sql;
	create table one_two as
		select two_long.name, two_long.unit, two_long.year, ranks.rank
		from one as ranks
			inner join two2_tr as two_long
			on ranks.name = two_long.unit
			and ranks.year = two_long.year;
quit;

/* Average the unit ranks within each original name and year */
proc sql;
	create table want as
		select distinct
			name,
			year,
			avg(rank) as rank
		from one_two
		group by name, year;
quit;


&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="Capture d’écran 2020-02-15 à 14.34.55.png" style="width: 400px;"&gt;&lt;img src="https://communities.sas.com/t5/image/serverpage/image-id/36146i4EFD1DED822B6D90/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Capture d’écran 2020-02-15 à 14.34.55.png" alt="Capture d’écran 2020-02-15 à 14.34.55.png" /&gt;&lt;/span&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Sat, 15 Feb 2020 13:35:32 GMT</pubDate>
    <dc:creator>ed_sas_member</dc:creator>
    <dc:date>2020-02-15T13:35:32Z</dc:date>
    <item>
      <title>Matching the String Variables</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/624985#M184176</link>
      <description>&lt;P&gt;Dear Experts,&lt;/P&gt;&lt;P&gt;I need to match string variables from two different datasets. Datasets look as follows:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Dataset one:&lt;/P&gt;&lt;P&gt;Name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Rank&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Year&lt;/P&gt;&lt;P&gt;A.S. Goldmen&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.01&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;A.S. Goldmen&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 3.01&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2003&lt;/P&gt;&lt;P&gt;AG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.51&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2001&lt;/P&gt;&lt;P&gt;AG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.61&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;Credit Suisse&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;3.50&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Dataset two:&lt;/P&gt;&lt;P&gt;Name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Year&lt;/P&gt;&lt;P&gt;A.S Goldmen&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 
&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2002&lt;/P&gt;&lt;P&gt;Goldmen (xxx)&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2003&lt;/P&gt;&lt;P&gt;AG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2001&lt;/P&gt;&lt;P&gt;AG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&amp;nbsp;&amp;nbsp;&lt;/P&gt;&lt;P&gt;A.S. GoldmenAG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;Credit Suisse&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2002&lt;/P&gt;&lt;P&gt;A.S. GoldmenAG EdwardsCredit Suisse&amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;So how will I merge these datasets by Name and Year? 
The problem is in Name variable in dataset two.&lt;/P&gt;&lt;P&gt;Output should be like this:&lt;/P&gt;&lt;P&gt;Name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;Rank&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Year&lt;/P&gt;&lt;P&gt;A.S. Goldmen&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.01&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;A.S. Goldmen&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 3.01&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2003&lt;/P&gt;&lt;P&gt;AG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.51&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2001&lt;/P&gt;&lt;P&gt;AG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 
&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.61&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;A.S. GoldmenAG Edwards&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.31&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2002&lt;/P&gt;&lt;P&gt;A.S. GoldmenAG EdwardsCredit Suisse&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; 2.7067&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;2002&lt;/P&gt;&lt;P&gt;For the row A.S. GoldmenAG Edwards, the Rank is the average rank of A.S. Goldmen and AG Edwards in 2002 ((2.01+2.61)/2 = 2.31). For the last row (A.S. GoldmenAG EdwardsCredit Suisse), the Rank is the average rank of A.S. Goldmen, AG Edwards and Credit Suisse ((2.01+2.61+ 3.50)/3 = 2.7067).&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Kind regards,&lt;/P&gt;&lt;P&gt;Abu&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 15 Feb 2020 03:36:02 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/624985#M184176</guid>
      <dc:creator>AbuChowdhury</dc:creator>
      <dc:date>2020-02-15T03:36:02Z</dc:date>
    </item>
    <item>
      <title>Re: Matching the String Variables</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625004#M184183</link>
      <description>Is this problem related to &lt;A href="https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/624985#M184176" target="_blank"&gt;https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/624985#M184176&lt;/A&gt;?</description>
      <pubDate>Sat, 15 Feb 2020 12:51:52 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625004#M184183</guid>
      <dc:creator>andreas_lds</dc:creator>
      <dc:date>2020-02-15T12:51:52Z</dc:date>
    </item>
    <item>
      <title>Re: Matching the String Variables</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625006#M184184</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/11763"&gt;@AbuChowdhury&lt;/a&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Here is one approach to do this.&lt;/P&gt;
&lt;P&gt;Hope this helps!&lt;/P&gt;
&lt;PRE&gt;&lt;CODE class=" language-sas"&gt;data one;
	/* Reference table: one Rank per Name and Year.                        */
	/* Fields are tab-delimited ("09"x), so a Name containing blanks is    */
	/* read as a single value.                                             */
	infile datalines dlm="09"x;
	/* The colon modifier reads Name up to the next delimiter (max 50 chars). */
	input Name:$50. Rank  Year;
	datalines;
A.S. Goldmen	2.01	2002
A.S. Goldmen	3.01	2003
AG Edwards	2.51	2001
AG Edwards	2.61	2002
Credit Suisse	3.50	2002
;

data two;
	/* Table to be matched against ONE. A Name here may be a single unit,  */
	/* a variant spelling ("Goldmen (xxx)"), or several units concatenated */
	/* without any separator. Fields are tab-delimited ("09"x).            */
	infile datalines dlm="09"x;
	input Name:$50. Year;
	datalines;
A.S. Goldmen	2002
Goldmen (xxx)	2003
AG Edwards	2001
AG Edwards	2002  
A.S. GoldmenAG Edwards	2002
Credit Suisse	2002
A.S. GoldmenAG EdwardsCredit Suisse	2002
; 

/* Build two macro variables from the distinct names in ONE:
     units       - comma-separated list of single-quoted names in which "."
                   and blanks have been rewritten as the regex tokens \. and \s
     total_units - the number of distinct names
   NOTE(review): only "." and blanks are escaped; a name containing other
   regex metacharacters (parentheses, +, ?, ...) would need extra handling. */
proc sql noprint;
	select distinct
		quote(tranwrd(tranwrd(strip(Name), '.', '\.'), ' ', '\s'), "'")
		into :units separated by ","
		from one;
	select count(distinct name)
		into :total_units
		from one;
quit;

/* Split each Name of TWO into the known units it contains, one unit per
   _name variable. The units and total_units macro variables are expected to
   have been created by the PROC SQL step that precedes this one. */
data two2;
	set two;
	if Name="Goldmen (xxx)" then Name="A.S. Goldmen"; /* Data management: map the variant spelling */
	id+1; /* running row counter, used as a BY key by the later sort/transpose */
	array _name(&amp;amp;total_units) $ 50;
	array _unit(&amp;amp;total_units) $ 50 _temporary_ (&amp;amp;units);
	do i=1 to &amp;amp;total_units;
		/* The test and the extraction use the same case-sensitive pattern, so
		   the captured text is exactly the occurrence that was tested and can
		   be joined on equality with ONE.Name. The pattern is anchored on the
		   whole value, hence a single replacement (times=1) is sufficient. */
		if prxmatch(cats('/^.*(',_unit(i),').*$/'),Name) then
			_name(i)=prxchange(cats('s/^.*(',_unit(i),').*$/$1/'),1,Name);
	end;
	drop i;
run;

/* Reshape TWO2 to long form: one row per id, name, year and non-blank unit */
proc sort data=two2;
	by id name year;
run;

proc transpose
		data=two2
		out=two2_tr (rename=(col1=unit) where=(unit ne "") drop=_name_);
	by id name year;
	var _name:;
run;

/* Attach to every extracted unit its rank for the same year */
proc sql;
	create table one_two as
		select two_long.name, two_long.unit, two_long.year, ranks.rank
		from one as ranks
			inner join two2_tr as two_long
			on ranks.name = two_long.unit
			and ranks.year = two_long.year;
quit;

/* Average the unit ranks within each original name and year */
proc sql;
	create table want as
		select distinct
			name,
			year,
			avg(rank) as rank
		from one_two
		group by name, year;
quit;


&lt;/CODE&gt;&lt;/PRE&gt;
&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-center" image-alt="Capture d’écran 2020-02-15 à 14.34.55.png" style="width: 400px;"&gt;&lt;img src="https://communities.sas.com/t5/image/serverpage/image-id/36146i4EFD1DED822B6D90/image-size/medium?v=v2&amp;amp;px=400" role="button" title="Capture d’écran 2020-02-15 à 14.34.55.png" alt="Capture d’écran 2020-02-15 à 14.34.55.png" /&gt;&lt;/span&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 15 Feb 2020 13:35:32 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625006#M184184</guid>
      <dc:creator>ed_sas_member</dc:creator>
      <dc:date>2020-02-15T13:35:32Z</dc:date>
    </item>
    <item>
      <title>Re: Matching the String Variables</title>
      <link>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625033#M184195</link>
      <description>&lt;P&gt;This links to the current message...&lt;/P&gt;</description>
      <pubDate>Sat, 15 Feb 2020 19:37:48 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Programming/Matching-the-String-Variables/m-p/625033#M184195</guid>
      <dc:creator>PGStats</dc:creator>
      <dc:date>2020-02-15T19:37:48Z</dc:date>
    </item>
  </channel>
</rss>

