/* ------------------------------------------------------------------ */
/* Quick look at the STEP1 data                                        */
/* ------------------------------------------------------------------ */

/* Print only the first 5 observations */
PROC PRINT DATA=BIO.PULSE_STEP1 (OBS=5);
RUN;

/* List the variables (in creation order, via VARNUM) to review names */
PROC CONTENTS DATA=BIO.PULSE_STEP1 VARNUM;
RUN;

/* Note: the raw data for our categorical variables are coded as numbers.
   We have not yet created translations for the variables in the STEP1
   data; the translation tutorials cover how to handle that scenario.
   It is not an issue here because we focus only on quantitative
   variables. */

/* ------------------------------------------------------------------ */
/* Normality diagnostics for a single variable (HEIGHT)                */
/* ------------------------------------------------------------------ */

/* NOPRINT on the PROC statement suppresses the tables of descriptive
   statistics, leaving only the plots requested below. */
PROC UNIVARIATE DATA=BIO.PULSE_STEP1 NOPRINT;
    VAR HEIGHT;

    /* Three versions of a similar plot, each comparing the sample to a
       theoretical normal distribution. They differ in exactly what is
       plotted against what; in every case, closer agreement indicates
       the sample is more nearly normally distributed.
       The one we will want is the first - QQPLOT. */

    /* Quantile-Quantile plot, normal reference with estimated mean/SD */
    QQPLOT / NORMAL(MU=EST SIGMA=EST);

    /* Probability plot, normal reference with estimated mean/SD */
    PROBPLOT / NORMAL(MU=EST SIGMA=EST);

    /* Probability-Probability plot; no distribution option is given,
       so the procedure's default reference distribution is used */
    PPPLOT;

    /* Histograms can also be created with this procedure.
       SAS still places them first in the output, even though they are
       requested last here. */

    /* Plain histogram */
    HISTOGRAM;

    /* Histogram overlaid with a fitted normal curve and a kernel density
       estimate; the inner NOPRINT suppresses the tables for the fitted
       normal distribution */
    HISTOGRAM / NORMAL(MU=EST SIGMA=EST NOPRINT) KERNEL;
RUN;

/* ------------------------------------------------------------------ */
/* Same diagnostics for several variables at once                      */
/* ------------------------------------------------------------------ */

/* One nice thing about UNIVARIATE: each plot statement is applied to
   every variable listed in VAR, so one step yields a Q-Q plot and a
   histogram for each of the five variables. */
PROC UNIVARIATE DATA=BIO.PULSE_STEP1 NOPRINT;
    VAR HEIGHT WEIGHT AGE PULSE1 PULSE2;

    QQPLOT / NORMAL(MU=EST SIGMA=EST);
    HISTOGRAM / NORMAL(MU=EST SIGMA=EST NOPRINT) KERNEL;
RUN;