/******************************* TOSA_D **********************************/ /***This program is used to calculate distance based topological change***/ /***********************Author: Nan "Wendy" Li ***************************/ /***********************wendyli0611@gmail.com*****************************/ /****************************May 16, 2015*********************************/ proc printto log="C:\temp\Save_my_log_please.log" new; /***Creat a log file***/ %macro TOSA_D(sample,data); /*Input data*/ data _null_; call symputx('ndat',count("&data",'|')+1); run; %do k=1 %to &ndat; /*Read data from an Excel spreadsheet*/ %let dat=%scan(&data,&k,'|'); data dis_&dat; set _null_; run; proc import out = &dat datafile = "&path.\&sample..xls" dbms = xls REPLACE; sheet = "&dat"; getnames = yes; run; proc contents data=&dat out=content;run; /*Read raw data into a SAS data table*/ proc sort data=content; by VARNUM;run; proc sql; select name into: vlist separated by ' ' from content; select count(name) into: nv from content; select distinct(NOBS) into: num from content; run; quit; %let num=%trim(%left(&num)); /*Initialize parameters*/ proc corr data=&dat cov out=cov; /*Calculate covirance matrix*/ var &vlist; run; data cov; set cov; /*Save covirance matrix*/ keep &vlist; if _n_ in (1:&nv); run; proc iml; use cov; read all into cov; close cov; cov_inv=inv(cov); /*Calculate the inverse matrix of original covirance matrix*/ use &dat; read all into g; close &dat; %do i=1 %to # /*Calculate mahalanobis distance between any two data points*/ %let t=&i+1; %do j=&t %to # c1=g[&i,]; c2=g[&j,]; c&i&j=c2-c1; t_c&i&j=t(c&i&j); _tmp&i&j=c&i&j*cov_inv*t_c&i&j; _z&i&j=sqrt(_tmp&i&j); create _z&i&j from _z&i&j[colname={"dis_&dat"}]; append from _z&i&j; %end; %end; quit; %do i=1 %to # /*Calculate the results*/ %let t=&i+1; %do j=&t %to # data dis_&dat; set dis_&dat _z&i&j;run; %end; %end; proc datasets nolist; delete _z:; run; quit; %end; data test; merge dis_input dis_output; /*Output the results into a data table*/ diff_sq=(dis_output-dis_input)**2; run; proc means data=test; /*Calculate the mean distance difference*/ var dis_output dis_input diff_sq; output out=means(drop=_TYPE_ _FREQ_); run; data means; set means; if _STAT_ in ('MEAN' 'N'); if _STAT_='N' then _STAT_='num_of_s'; if _STAT_='MEAN' then diff=sqrt(diff_sq); run; proc export data= work.means /*Export the results*/ outfile= "&path.\TOSAD_result.xls" dbms=excel replace; sheet="TOSAD_result"; run; %mend; %TOSA_D(sample=sample, data=input|output, path=C:\test); proc printto; title; run;