<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Large number of observations with missing values in regression output in SAS Studio</title>
    <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450058#M5064</link>
    <description>&lt;P&gt;&lt;SPAN&gt;Salary is in&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;Compustat_ExecuComp4.&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;And with regards to&amp;nbsp;annual_return, I will quote a SAS expert from another post:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Do you always begin with January and end with December?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is DATE a SAS date, or merely a numeric value with YMD?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is your data in sorted order by TICKER DATE?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Assuming "yes", "just a number", and "yes", you could program it in this way:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I will look into your other points now.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;data temp;&lt;/P&gt;&lt;P&gt;set have;&lt;/P&gt;&lt;P&gt;by ticker date;&lt;/P&gt;&lt;P&gt;retain annual_return 1;&lt;/P&gt;&lt;P&gt;annual_return = annual_return * (1 + RET);&lt;/P&gt;&lt;P&gt;month = int( mod(date,10000) / 100);&lt;/P&gt;&lt;P&gt;if month = 12;&lt;/P&gt;&lt;P&gt;annual_return = (annual_return - 1) * 100;&lt;/P&gt;&lt;P&gt;output;&lt;/P&gt;&lt;P&gt;annual_return = 1;&lt;/P&gt;&lt;P&gt;run;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;If DATE is actually a SAS date, the calculation of MONTH is easier:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;month = month(date);&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Note that the annualized return is calculated separately for each year.&amp;nbsp; If you get 10% for one year, and 20% for the next year, the total value after two years would be 1.1 * 1.2 * original value ... all assuming that I got the formulas correct.&lt;/P&gt;</description>
    <pubDate>Fri, 30 Mar 2018 20:19:25 GMT</pubDate>
    <dc:creator>sastuck</dc:creator>
    <dc:date>2018-03-30T20:19:25Z</dc:date>
    <item>
      <title>Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450003#M5051</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am modeling the effect of firm performance on CEO salary. SAS read 10,741 observations from my merged ceo_firm data set, but only used 2,066 of them. 8,675 observations had missing values. I am surprised by this, however, due to the substantive data cleaning I have done in preparation for running the regression. Do you have any idea why I could still be missing so many observations? Here is my code:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;libname paper "~/425/425_Final_Paper";

*import compustat dataset;
PROC IMPORT out=paper.CompuStat_Execucomp
datafile="~/425/425_Final_Paper/CompuStat_Execucomp.csv"
DBMS=CSV replace;
getnames= yes;
guessingrows=2000;
run;

*keep only CEOs;
data paper.Compustat_ExecuComp2;
set paper.Compustat_ExecuComp;
if CEOANN = 'CEO';
run;

*** extra DATA step for checking previous data step results by comparing number of records selected;
data check_CEOANN;
set paper.Compustat_ExecuComp;
if CEOANN =: 'CEO';
run;

proc sort data=paper.Compustat_ExecuComp2;
by ticker year;
run;

*import csrp dataset;
PROC IMPORT out=paper.CSRP_Monthly_Stock_char
datafile="~/425/425_Final_Paper/CSRP_MonthlyStock_char.csv"
DBMS=CSV replace;
getnames= yes;
guessingrows=max;
run;

*remove bad data; 
data paper.CSRP_Monthly_Stock_char2;
set paper.CSRP_Monthly_Stock_char (rename=(ret=character_ret));
drop character_ret;
if cusip = ' ' then delete;
ret = input(character_ret, ??8.);
if ret = . then delete;
date = input(put(date, z8.), yymmdd8.);
format date yymmdd10.;
year = year(date);
month = month(date);
if cusip =: '?' then cusip = substr(cusip, 2);
run;

proc contents 
data=paper.CSRP_Monthly_Stock_char2;
run;

proc sort data=paper.CSRP_Monthly_Stock_char2;
by ticker year;
run;

*Remove all bad years from both data sources;
data paper.Compustat_ExecuComp3;
merge paper.Compustat_ExecuComp2
paper.multiple_CEOs (keep=ticker year in=had_multiple_CEOs);
by ticker year;
if had_multiple_CEOs then delete;
run;

data paper.CSRP_Monthly_Stock_char3;
merge paper.CSRP_Monthly_Stock_char2
paper.multiple_CEOs (keep=ticker year in=had_multiple_CEOs);
by ticker year;
if had_multiple_CEOs then delete;
run;

*find additional bad data: multiple return records for the same month/year;
proc freq data=paper.CSRP_Monthly_Stock_char3;
tables ticker * year * month / noprint out=paper.multiple_returns (where=(count &amp;gt; 1));
run;

*Remove all matching year data for multiple returns;
proc sort data=paper.multiple_returns out=multiple_returns (keep=ticker year) NODUPKEY;
by ticker year;
run;

data paper.Compustat_ExecuComp4;
merge paper.Compustat_ExecuComp3
multiple_returns (in=had_multiple_returns);
by ticker year;
if had_multiple_returns then delete;
run;

data paper.CSRP_Monthly_Stock_char4;
merge paper.CSRP_Monthly_Stock_char3
multiple_returns (in=had_multiple_returns);
by ticker year;
if had_multiple_returns then delete;
run;

*create new variable annualized growth;
data paper.CSRP_annual_returns;
set paper.CSRP_Monthly_Stock_char4;
by ticker year;
retain annual_return 1;
annual_return = annual_return * (1 + RET);
if month = 12 or last.ticker;
annual_return = (annual_return - 1) * 100;
output;
annual_return = 1;
keep ticker year annual_return;
run;

*use proc contents to see if there is a type mismatch;
proc contents 
data=paper.CSRP_annual_returns;
run;

proc contents 
data=paper.Compustat_ExecuComp4;
run;

*MERGE statement has more than one data set with repeats of BY values;
proc sort data=paper.compustat_execucomp4;
  by ticker;
run;
proc sort data=paper.CSRP_annual_returns nodupkey;
  by ticker;
run;
data want;
  merge paper.compustat_execucomp4 (in=in1) paper.CSRP_annual_returns;
  by ticker;
  if in1;
run;

*Merge CEO data and firm data; 
DATA paper.ceo_firm ; 
length ticker $5;
MERGE paper.CSRP_annual_returns 
paper.compustat_execucomp4; 
BY ticker; 
RUN;

proc contents 
data=paper.ceo_firm;
run;

*remove missing return data; 
data paper.ceo_firm;
set paper.ceo_firm;
if annual_return = . then delete;
run;

proc means data=paper.CSRP_Monthly_Stock_char3   n nmiss;
var ret;
run;

*Use OLS to estimate model;
title "";
ods graphics on;
proc reg data=paper.ceo_firm plots(maxpoints=none);
model salary = annual_return /clb acov;
run;  
ods graphics off;&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks in advance for the help!&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 18:32:48 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450003#M5051</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-03-30T18:32:48Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450009#M5054</link>
      <description>&lt;P&gt;Without seeing the data I don't think anyone can tell you why you are missing salary and/or annual return from so many records.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I think you have to manually review the files to see why there are so many missing values. Could be an error in how the data was imported.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 18:51:38 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450009#M5054</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-03-30T18:51:38Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450011#M5056</link>
      <description>&lt;P&gt;Which particular dataset do you think would be helpful in looking at this issue?&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 18:52:57 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450011#M5056</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-03-30T18:52:57Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450016#M5058</link>
      <description>&lt;P&gt;Post the results of&amp;nbsp;the PROC MEANS call&lt;/P&gt;
&lt;PRE&gt;proc means data=paper.CSRP_Monthly_Stock_char3   n nmiss;
var salary annual_return;
run;&lt;/PRE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;It contains the count of missing and nonmissing&amp;nbsp;values for the variables in your&amp;nbsp;model.&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 19:04:03 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450016#M5058</guid>
      <dc:creator>Rick_SAS</dc:creator>
      <dc:date>2018-03-30T19:04:03Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450023#M5059</link>
      <description>&lt;P&gt;I agree, in principle, with Rick, but I don't think RET is the variable you're using. Your code includes:&lt;/P&gt;
&lt;PRE&gt;data paper.CSRP_annual_returns;
  set paper.CSRP_Monthly_Stock_char4;
  by ticker year;
  retain annual_return 1;
  annual_return = annual_return * (1 + RET);
  if month = 12 or last.ticker;
  annual_return = (annual_return - 1) * 100;
  output;
  annual_return = 1;
  keep ticker year annual_return;
run;&lt;/PRE&gt;
&lt;P&gt;In that code you're only calculating annual_return if month=12 or it's the last record for a particular ticker. Is that really what you want to be doing? And your proc means only analyzes RET, while your variable is annual_return.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I don't know which file contains SALARY&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO,&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 19:10:55 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450023#M5059</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-03-30T19:10:55Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450045#M5061</link>
      <description>&lt;P&gt;From&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;proc means data=paper.Compustat_ExecuComp4   n nmiss;
var salary;
run;&lt;/PRE&gt;&lt;DIV class="proc_title_group"&gt;&lt;P class="c proctitle"&gt;The MEANS Procedure&lt;/P&gt;&lt;/DIV&gt;&lt;P&gt;&amp;nbsp;Analysis Variable : SALARY&lt;/P&gt;&lt;TABLE&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TH&gt;N&lt;/TH&gt;&lt;TH&gt;N Miss&lt;/TH&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;13346&lt;/TD&gt;&lt;TD&gt;0&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;and from:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;proc means data=paper.CSRP_annual_returns   n nmiss;
var annual_return;
run;&lt;/PRE&gt;&lt;P&gt;we get&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;DIV class="proc_title_group"&gt;&lt;P class="c proctitle"&gt;The MEANS Procedure&lt;/P&gt;&lt;/DIV&gt;&lt;P&gt;&amp;nbsp;Analysis Variable : annual_return&lt;/P&gt;&lt;TABLE&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TH&gt;N&lt;/TH&gt;&lt;TH&gt;N Miss&lt;/TH&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;53176&lt;/TD&gt;&lt;TD&gt;0&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;</description>
      <pubDate>Fri, 30 Mar 2018 19:58:40 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450045#M5061</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-03-30T19:58:40Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450054#M5062</link>
      <description>&lt;P&gt;Didn't you really want to run those proc means on paper.ceo_firm since that is the file you're using in proc reg?&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;proc reg data=paper.ceo_firm plots(maxpoints=none);
model salary = annual_return /clb acov;
run;&lt;/PRE&gt;
&lt;P&gt;And you haven't (I don't think) addressed the question I raised in my previous post.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 20:16:21 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450054#M5062</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-03-30T20:16:21Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450058#M5064</link>
      <description>&lt;P&gt;&lt;SPAN&gt;Salary is in&amp;nbsp;&lt;/SPAN&gt;&lt;SPAN&gt;Compustat_ExecuComp4.&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;And with regards to&amp;nbsp;annual_return, I will quote a SAS expert from another post:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Do you always begin with January and end with December?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is DATE a SAS date, or merely a numeric value with YMD?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is your data in sorted order by TICKER DATE?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Assuming "yes", "just a number", and "yes", you could program it in this way:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I will look into your other points now.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;data temp;&lt;/P&gt;&lt;P&gt;set have;&lt;/P&gt;&lt;P&gt;by ticker date;&lt;/P&gt;&lt;P&gt;retain annual_return 1;&lt;/P&gt;&lt;P&gt;annual_return = annual_return * (1 + RET);&lt;/P&gt;&lt;P&gt;month = int( mod(date,10000) / 100);&lt;/P&gt;&lt;P&gt;if month = 12;&lt;/P&gt;&lt;P&gt;annual_return = (annual_return - 1) * 100;&lt;/P&gt;&lt;P&gt;output;&lt;/P&gt;&lt;P&gt;annual_return = 1;&lt;/P&gt;&lt;P&gt;run;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;If DATE is actually a SAS date, the calculation of MONTH is easier:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;month = month(date);&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Note that the annualized return is calculated separately for each year.&amp;nbsp; If you get 10% for one year, and 20% for the next year, the total value after two years would be 1.1 * 1.2 * original value ... all assuming that I got the formulas correct.&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 20:19:25 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450058#M5064</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-03-30T20:19:25Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450072#M5065</link>
      <description>&lt;P&gt;I don't know who provided that code or whether or not it's doing what you want. Most of us on this forum are users .. just like you. We don't get paid, may sometimes suggest wrong answers, and often aren't provided with enough details to make a suggestion that actually does what the requester wanted to do (but didn't convey the correct request).&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;As for myself, I wouldn't necessarily call myself an expert, but I do have a PhD and have been using SAS for the past 45 years.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Make up an example for two years of one ticker and, for each record, show what you expect the value of annual_return to be.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;As for Salary, it has to be in the file you are analyzing with proc reg. Earlier you had asked which file to look at to identify why you had missing values .. I think it may be the comparison of those two files and, if they're different, figuring out why they're different.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;P.S. I just looked up the original post and, if your data are in fact monthly values, then the code that&amp;nbsp;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/4954"&gt;@Astounding&lt;/a&gt;&amp;nbsp;suggested does indeed do the calculation correctly. However, I also noticed in that thread that you were trying to obtain the geometric mean, but didn't see&amp;nbsp;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/31461"&gt;@mkeintz&lt;/a&gt;'s suggestion incorporated in your code.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;However, I also noticed in that thread, that you were getting missing values back then. Was that problem ever corrected?&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 30 Mar 2018 22:27:24 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450072#M5065</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-03-30T22:27:24Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450083#M5066</link>
      <description>&lt;P&gt;A) I am going to forgo the geometric mean for now. I am just looking for percentage growth over the course of a year. Here’s an example of what I would expect, based off numbers from yahoo finance:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Ticker&amp;nbsp;&amp;nbsp;&amp;nbsp; year&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; annual_return&lt;/P&gt;&lt;P&gt;AAOI &amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;2014&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 61.35%&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; (my data actually says its -35.15776393)&lt;/P&gt;&lt;P&gt;ACFC&amp;nbsp;&amp;nbsp;&amp;nbsp; 2013&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 115.42%&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; (my data actually says its 125.9565%)&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;B) I used:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;proc contents&lt;/P&gt;&lt;P&gt;data=paper.ceo_firm;&lt;/P&gt;&lt;P&gt;run;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;to confirm that salary is in the data set I am analyzing with proc reg&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is this what you were wondering?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;C) I will find that thread and investigate my missing values further.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/13711"&gt;@art297&lt;/a&gt;&amp;nbsp;any other suggestions?&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 20:00:28 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450083#M5066</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-04-01T20:00:28Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450269#M5101</link>
      <description>&lt;P&gt;From what I've read in previous posts on this and related topics I'd be most interested in seeing what data was missing and, if the results didn't seem reasonable, I'd investigate further.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;You might want to run something like:&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;proc format;&lt;BR /&gt; value sal&lt;BR /&gt; .='Missing'&lt;BR /&gt; low-4999='&amp;lt;5000'&lt;BR /&gt; 5000-39999='&amp;lt; 40000'&lt;BR /&gt; 40000-high='40000 or more'&lt;BR /&gt; ;&lt;BR /&gt; value return&lt;BR /&gt; .='missing'&lt;BR /&gt; low-.299='&amp;lt; .3'&lt;BR /&gt; .3-.499='&amp;lt;.5'&lt;BR /&gt; .5-high='.5 or more'&lt;BR /&gt; ;&lt;BR /&gt;run;&lt;/P&gt;
&lt;P&gt;proc freq data=paper.ceo_firm;&lt;BR /&gt; tables year*(annual_return salary)/ missing;&lt;BR /&gt; format salary sal.;&lt;BR /&gt; format annual_return return.;&lt;BR /&gt;run;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Of course, you might want to select better ranges for the formats.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 21:25:23 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450269#M5101</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-04-01T21:25:23Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450271#M5103</link>
      <description>&lt;P&gt;Here is what the output looks like:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;TABLE&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TD&gt;Table&amp;nbsp;of&amp;nbsp;year&amp;nbsp;by&amp;nbsp;annual_returnyear annual_returnmissing &amp;lt; .3 &amp;lt;.5 .5 or more Total20102011201220132014201520162017Total &lt;TABLE&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;156&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.72&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.33&lt;/DIV&gt;&lt;DIV class="r t"&gt;22.41&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1843&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.45&lt;/DIV&gt;&lt;DIV class="r t"&gt;27.53&lt;/DIV&gt;&lt;DIV class="r t"&gt;29.12&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;26&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.12&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.39&lt;/DIV&gt;&lt;DIV class="r t"&gt;32.91&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;4670&lt;/DIV&gt;&lt;DIV class="r t"&gt;21.42&lt;/DIV&gt;&lt;DIV class="r t"&gt;69.75&lt;/DIV&gt;&lt;DIV class="r t"&gt;31.76&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;6695&lt;/DIV&gt;&lt;DIV class="r t"&gt;30.70&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;137&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.63&lt;/DIV&gt;&lt;DIV class="r t"&gt;5.03&lt;/DIV&gt;&lt;DIV class="r t"&gt;19.68&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;892&lt;/DIV&gt;&lt;DIV class="r t"&gt;4.09&lt;/DIV&gt;&lt;DIV class="r t"&gt;32.78&lt;/DIV&gt;&lt;DIV class="r t"&gt;14.09&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r 
t"&gt;8&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.29&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.13&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1684&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.72&lt;/DIV&gt;&lt;DIV class="r t"&gt;61.89&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.45&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2721&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.48&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;114&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.52&lt;/DIV&gt;&lt;DIV class="r t"&gt;4.84&lt;/DIV&gt;&lt;DIV class="r t"&gt;16.38&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;594&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.72&lt;/DIV&gt;&lt;DIV class="r t"&gt;25.24&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.38&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;8&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.34&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.13&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1637&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.51&lt;/DIV&gt;&lt;DIV class="r t"&gt;69.57&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.13&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2353&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.79&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;97&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.44&lt;/DIV&gt;&lt;DIV class="r t"&gt;4.00&lt;/DIV&gt;&lt;DIV class="r 
t"&gt;13.94&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;608&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.79&lt;/DIV&gt;&lt;DIV class="r t"&gt;25.06&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.61&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;10&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.05&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.41&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.66&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1711&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.85&lt;/DIV&gt;&lt;DIV class="r t"&gt;70.53&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.64&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2426&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.12&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;86&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.39&lt;/DIV&gt;&lt;DIV class="r t"&gt;3.44&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.36&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;781&lt;/DIV&gt;&lt;DIV class="r t"&gt;3.58&lt;/DIV&gt;&lt;DIV class="r t"&gt;31.27&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.34&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;8&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.32&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.13&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1623&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.44&lt;/DIV&gt;&lt;DIV class="r t"&gt;64.97&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.04&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2498&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.46&lt;/DIV&gt;&lt;DIV class="r 
t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;64&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.29&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.67&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.20&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;803&lt;/DIV&gt;&lt;DIV class="r t"&gt;3.68&lt;/DIV&gt;&lt;DIV class="r t"&gt;33.44&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.69&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;10&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.05&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.42&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.66&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1524&lt;/DIV&gt;&lt;DIV class="r t"&gt;6.99&lt;/DIV&gt;&lt;DIV class="r t"&gt;63.47&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.37&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2401&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.01&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;42&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.19&lt;/DIV&gt;&lt;DIV class="r t"&gt;1.97&lt;/DIV&gt;&lt;DIV class="r t"&gt;6.03&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;564&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.59&lt;/DIV&gt;&lt;DIV class="r t"&gt;26.42&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.91&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;9&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.42&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.39&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r 
t"&gt;1520&lt;/DIV&gt;&lt;DIV class="r t"&gt;6.97&lt;/DIV&gt;&lt;DIV class="r t"&gt;71.19&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.34&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2135&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.79&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;0&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;245&lt;/DIV&gt;&lt;DIV class="r t"&gt;1.12&lt;/DIV&gt;&lt;DIV class="r t"&gt;42.39&lt;/DIV&gt;&lt;DIV class="r t"&gt;3.87&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;0&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;333&lt;/DIV&gt;&lt;DIV class="r t"&gt;1.53&lt;/DIV&gt;&lt;DIV class="r t"&gt;57.61&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.26&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;578&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.65&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;696&lt;/DIV&gt;&lt;DIV class="r t"&gt;3.19&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;6330&lt;/DIV&gt;&lt;DIV class="r t"&gt;29.03&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;79&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.36&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV 
class="stacked-cell"&gt;&lt;DIV class="r t"&gt;14702&lt;/DIV&gt;&lt;DIV class="r t"&gt;67.42&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;21807&lt;/DIV&gt;&lt;DIV class="r t"&gt;100.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;TABLE&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="t"&gt;Frequency&lt;/DIV&gt;&lt;DIV class="t"&gt;Percent&lt;/DIV&gt;&lt;DIV class="t"&gt;Row Pct&lt;/DIV&gt;&lt;DIV class="t"&gt;Col Pct&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;Table&amp;nbsp;of&amp;nbsp;year&amp;nbsp;by&amp;nbsp;SALARYyear SALARYMissing &amp;lt;5000 &amp;lt; 40000 Total20102011201220132014201520162017Total &lt;TABLE&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;4665&lt;/DIV&gt;&lt;DIV class="r t"&gt;21.39&lt;/DIV&gt;&lt;DIV class="r t"&gt;69.68&lt;/DIV&gt;&lt;DIV class="r t"&gt;55.14&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2029&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.30&lt;/DIV&gt;&lt;DIV class="r t"&gt;30.31&lt;/DIV&gt;&lt;DIV class="r t"&gt;15.21&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.01&lt;/DIV&gt;&lt;DIV class="r t"&gt;20.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;6695&lt;/DIV&gt;&lt;DIV class="r t"&gt;30.70&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;726&lt;/DIV&gt;&lt;DIV class="r t"&gt;3.33&lt;/DIV&gt;&lt;DIV class="r t"&gt;26.68&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.58&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV 
class="r t"&gt;1994&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.14&lt;/DIV&gt;&lt;DIV class="r t"&gt;73.28&lt;/DIV&gt;&lt;DIV class="r t"&gt;14.95&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;20.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2721&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.48&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;425&lt;/DIV&gt;&lt;DIV class="r t"&gt;1.95&lt;/DIV&gt;&lt;DIV class="r t"&gt;18.06&lt;/DIV&gt;&lt;DIV class="r t"&gt;5.02&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1927&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.84&lt;/DIV&gt;&lt;DIV class="r t"&gt;81.90&lt;/DIV&gt;&lt;DIV class="r t"&gt;14.44&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;20.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2353&lt;/DIV&gt;&lt;DIV class="r t"&gt;10.79&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;502&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.30&lt;/DIV&gt;&lt;DIV class="r t"&gt;20.69&lt;/DIV&gt;&lt;DIV class="r t"&gt;5.93&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1923&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.82&lt;/DIV&gt;&lt;DIV class="r t"&gt;79.27&lt;/DIV&gt;&lt;DIV class="r 
t"&gt;14.41&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;20.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2426&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.12&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;622&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.85&lt;/DIV&gt;&lt;DIV class="r t"&gt;24.90&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.35&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1875&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.60&lt;/DIV&gt;&lt;DIV class="r t"&gt;75.06&lt;/DIV&gt;&lt;DIV class="r t"&gt;14.05&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.04&lt;/DIV&gt;&lt;DIV class="r t"&gt;20.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2498&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.46&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;596&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.73&lt;/DIV&gt;&lt;DIV class="r t"&gt;24.82&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.04&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1805&lt;/DIV&gt;&lt;DIV class="r t"&gt;8.28&lt;/DIV&gt;&lt;DIV class="r t"&gt;75.18&lt;/DIV&gt;&lt;DIV class="r t"&gt;13.53&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;0&lt;/DIV&gt;&lt;DIV class="r 
t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2401&lt;/DIV&gt;&lt;DIV class="r t"&gt;11.01&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;421&lt;/DIV&gt;&lt;DIV class="r t"&gt;1.93&lt;/DIV&gt;&lt;DIV class="r t"&gt;19.72&lt;/DIV&gt;&lt;DIV class="r t"&gt;4.98&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;1714&lt;/DIV&gt;&lt;DIV class="r t"&gt;7.86&lt;/DIV&gt;&lt;DIV class="r t"&gt;80.28&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.85&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;0&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;2135&lt;/DIV&gt;&lt;DIV class="r t"&gt;9.79&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;504&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.31&lt;/DIV&gt;&lt;DIV class="r t"&gt;87.20&lt;/DIV&gt;&lt;DIV class="r t"&gt;5.96&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;74&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.34&lt;/DIV&gt;&lt;DIV class="r t"&gt;12.80&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.55&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;0&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV 
class="stacked-cell"&gt;&lt;DIV class="r t"&gt;578&lt;/DIV&gt;&lt;DIV class="r t"&gt;2.65&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV class="r t"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;TR&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;8461&lt;/DIV&gt;&lt;DIV class="r t"&gt;38.80&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;13341&lt;/DIV&gt;&lt;DIV class="r t"&gt;61.18&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;5&lt;/DIV&gt;&lt;DIV class="r t"&gt;0.02&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;TD&gt;&lt;DIV class="stacked-cell"&gt;&lt;DIV class="r t"&gt;21807&lt;/DIV&gt;&lt;DIV class="r t"&gt;100.00&lt;/DIV&gt;&lt;/DIV&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Do you see anything systematic going on here?&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 21:33:14 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450271#M5103</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-04-01T21:33:14Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450273#M5105</link>
      <description>&lt;P&gt;The tables posted in a garbled fashion where one can't tell what they represent. It would, in this case, be better to take a snapshot of the result screens and post them as PDF files.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 21:39:24 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450273#M5105</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-04-01T21:39:24Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450274#M5106</link>
      <description>&lt;P&gt;You know what--it looks like this was linked to the case of the merge statement having&amp;nbsp;more than one data set with repeats of BY values. Since implementing the code that you and&amp;nbsp;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/159"&gt;@Tom&lt;/a&gt;&amp;nbsp;came up with, SAS read 12,650 observations, and SAS used 12,650 observations. Perfect!&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;So the issue must have been that the regression excluded observations found in one source but not both and labelled them as "missing," meaning they didn't match with the other data?&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 21:39:51 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450274#M5106</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-04-01T21:39:51Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450275#M5107</link>
      <description>&lt;P&gt;&lt;a href="https://communities.sas.com/t5/user/viewprofilepage/user-id/13711"&gt;@art297&lt;/a&gt;, my bad. I will take note of that for next time. It's just that I have been told more than a few times that people prefer not to have to open attached files on this forum, is all.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 21:41:23 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450275#M5107</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-04-01T21:41:23Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450276#M5108</link>
      <description>&lt;P&gt;People on the forum don't like pictures of datasets .. they'd rather have data posted in the form of an analyzable data step.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Similarly, they don't like opening file types that might contain viruses, like Word or Excel.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;However, when showing one's output, a picture (e.g., JPG, PDF or the like) I'd think would be welcomed by most.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Art, CEO, AnalystFinder.com&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 21:45:15 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450276#M5108</guid>
      <dc:creator>art297</dc:creator>
      <dc:date>2018-04-01T21:45:15Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450279#M5109</link>
      <description>&lt;P&gt;I'm not going to go through your code, and I don't have your data set, but the problem is that a missing value in the X variable or a missing value in the Y variable will cause SAS to NOT use that record.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;The very simple step that you need to take is to open the data set paper.ceo_firm into SAS ViewTable (or other viewer) and actually look at the data being sent into PROC REG and see if there are missing values. Or use the NMISS function to count the number of missing values in each record (among the X and Y variables used in the regression).&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 22:10:48 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450279#M5109</guid>
      <dc:creator>PaigeMiller</dc:creator>
      <dc:date>2018-04-01T22:10:48Z</dc:date>
    </item>
    <item>
      <title>Re: Large number of observations with missing values in regression output</title>
      <link>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450280#M5110</link>
      <description>&lt;P&gt;This issue has already been resolved. Thanks though.&lt;/P&gt;</description>
      <pubDate>Sun, 01 Apr 2018 22:28:27 GMT</pubDate>
      <guid>https://communities.sas.com/t5/SAS-Studio/Large-number-of-observations-with-missing-values-in-regression/m-p/450280#M5110</guid>
      <dc:creator>sastuck</dc:creator>
      <dc:date>2018-04-01T22:28:27Z</dc:date>
    </item>
  </channel>
</rss>

