Reputation: 1764
I have a data set that looks like this:
data have;
input category $ type $ percent order;
datalines;
X Full 1 1
X B -.04 .
X A -.02 .
X E 0 .
X D .03 .
X C .01 .
;
run;
I want to create a waterfall showing what is "Leftover" after the modifications A-E. The code below does this successfully.
I have two questions:
Thanks!
proc sort data=have(where=(percent<0))
out=neg;
by percent;
run;
data neg;
set neg;
order=_N_+1;
run;
proc sql noprint;
select max(order) into :max_order from neg;
quit;
proc sort data=have(where=(percent>0 and type not in ("Full")))
out=pos;
by descending percent;
run;
data pos;
set pos;
order=_N_+&max_order.;
run;
data x_have;
set have(where=(type="Full")) neg pos;
run;
proc sort data=x_have;
by order;
run;
proc sgplot data=have(where=(percent ne 0)) noautolegend;
waterfall category=type response=percent / colorgroup=type dataskin=sheen datalabel name='a'
finalbartickvalue='Leftover';
;
xaxis display=(nolabel);
yaxis grid display=(nolabel) offsetmin=0;
run;
Upvotes: 0
Views: 508
Reputation: 1764
Thanks to @Joe and Sanjay Matange, I started working this through a highlow plot instead of waterfall. It was a little messy to manipulate the data so it was repeatable (and I can probably go back and clean it up some), but here is the solution for anybody interested.
data have;
input category $ type $ percent order;
datalines;
X Full 1 1
X B -.04 .
X A -.02 .
X E 0 .
X D .03 .
X C .01 .
X F .6 .
X sum1 . .
X sum2 . .
;
run;
proc sql noprint;
select sum(percent)
into :sum
from have
where type in ('A','B','C','D','E');
select percent
into :F
from have
where type='F';
select percent
into :maxperc
from have
where type="Full";
quit;
data have_mod;
set have;
if type='sum1' then percent=1+&sum.;
if type='sum2' then percent=1+&sum.-&F.;
run;
proc sort data=have_mod(where=(percent<0))
out=neg;
by percent;
run;
data neg;
set neg;
order=_N_+1;
run;
proc sql noprint;
select max(order) into :max_neg from neg;
quit;
proc sort data=have_mod(where=(percent>0 and type not in ("Full","sum1","sum2","F")))
out=pos;
by descending percent;
run;
data pos;
set pos;
order=_N_+&max_neg.;
run;
proc sql noprint;
select max(order) into :max_pos from pos;
quit;
data x_have;
set have_mod(where=(type in ("Full", "F", "sum1", "sum2"))) neg pos;
if type='sum1' then order=1+&max_pos.;
if type='F' then order=2+&max_pos.;
if type='sum2' then order=3+&max_pos.;
run;
proc sort data=x_have;
by order;
run;
proc sql noprint;
select percent, order
into :sum1, :ordersum1
from x_have
where type='sum1';
quit;
data want;
set x_have;
by category;
if first.category then sumpercent=0;
sumpercent+percent;
if type in ('sum1','F','sum2') then sumpercent=percent;
if type in ('Full','sum1','sum2') then high=sumpercent;
else if type='F' then high=&sum1.;
else if order=&ordersum1.-1 then high=&sum1.;
else if order=2 then high=&maxperc.;
else if percent>0 then high=sumpercent;
else if percent<0 then high=sumpercent+abs(percent);
if type in ('Full','sum1','sum2') then low=0;
else if percent<0 then low=sumpercent;
else if type='F' then low=high-sumpercent;
else if percent>0 then low=sumpercent-percent;
run;
proc sgplot data=want;
highlow x=type high=high low=low / group=type type=bar
groupdisplay=cluster highlabel=percent lineattrs=graphoutlines
dataskin=matte;
xaxis display=(nolabel noticks);
yaxis offsetmin=0;
run;
Upvotes: 1