套利组合收益的节假日统计

需求:统计节假日效应:节前一周内开仓和节后一周内开仓的收益情况
其中,套利组合在开平仓信号内,按照周一-周五分别开仓。

解决步骤:
1.数据处理
1.1导入周一-周五组合的市值数据,组合数据包含开仓时间(start),平仓时间(end),
   开仓市值(open),平仓市值(close),平仓沪深300市值(hs_close)。
PROC IMPORT OUT= WORK.e
            DATAFILE= "C:\Documents and Settings\Administrator\My Docume
nts\My SAS Files\9.2\汇总表.xls"
            DBMS=EXCEL REPLACE;
     RANGE="周五$";
     GETNAMES=YES;
     MIXED=NO;
     SCANTEXT=YES;
     USEDATE=YES;
     SCANTIME=YES;
RUN;
data e;*e为周五组合数据,类似可以得到周四(d)周三(c)周二(b)周一(a)数据;
   set e;
   ret=(close-hs_close)/open;*ret为组合收益;
run;
......................
1.2导入沪深300指数日线数据并计算涨幅
PROC IMPORT OUT= WORK.hs
            DATAFILE= "C:\Documents and Settings\Administrator\My Docume
nts\My SAS Files\9.2\汇总表.xls"
            DBMS=EXCEL REPLACE;
     RANGE="sheet1$";
     GETNAMES=YES;
     MIXED=NO;
     SCANTEXT=YES;
     USEDATE=YES;
     SCANTIME=YES;
RUN;
data hs;
   set hs;
   ret1=dif(close_hs)/lag(close_hs);*ret为涨幅;
   date=input(compress(start),yymmdd10.);
   format date date9.;
   drop start;
 run;

1.3将沪深300指数数据与组合收益数据合并为一张表
%macro zhangfu(datafile);
proc sql noprint;
   create table hs_&datafile as
   select *
      from &datafile
   left join hs
      on &datafile..start=hs.date ;
quit;
%mend;
%zhangfu(a);%zhangfu(b);%zhangfu(c);%zhangfu(d);%zhangfu(e);

1.4利用2010年至今数据统计节假日收益情况,首先需要明确2010-2012期间的
   法定节假日情况,然后进行筛选出节假日前后开平仓的组合收益(节前7天内)
%macro holiday(datafiles);
data holiday_&datafiles ;
   set &datafiles;
  
   h_1 = '01jan2010'd ; 
   h_2 = '03jan2010'd ; 
   h_3 = '13feb2010'd ;
   h_4 = '19feb2010'd ;
   h_5 = '03apr2010'd ;
   h_6 = '05apr2010'd ;
   h_7 = '01may2010'd ;
   h_8 = '03may2010'd ;
   h_9 = '14jun2010'd ;
   h_10= '16jun2010'd;
   h_11= '22sep2010'd;
   h_12= '24sep2010'd;
   h_13= '01oct2010'd;
   h_14= '07oct2010'd;

   h_15= '01jan2011'd;
   h_16= '03jan2011'd;
   h_17= '02feb2011'd;
   h_18= '08feb2011'd;
   h_19= '03apr2011'd;
   h_20= '05apr2011'd;
   h_21= '30apr2011'd;
   h_22= '02may2011'd;
   h_23= '04jun2011'd;
   h_24= '06jun2011'd;
   h_25= '10sep2011'd;
   h_26= '12sep2011'd;
   h_27= '01oct2011'd;
   h_28= '07oct2011'd;

   h_29= '01jan2012'd;
   h_30= '03jan2012'd;
   h_31= '22jan2012'd;
   h_32= '28jan2012'd;
   h_33= '02apr2012'd;
   h_34= '02apr2012'd;
   h_35= '29apr2012'd;
   h_36= '01may2012'd;
   h_37= '22jun2012'd;
   h_38= '24jun2012'd;
   h_39= '30sep2012'd;
   h_40= '07oct2012'd;
  
   format h_: date9. ret percentn10.2;
  
 
   select ;
   when (abs(start - h_1) <7 )  output;
   when (abs(start - h_2) <7 ) output;
   when (abs(start - h_3) <7 ) output;
   when (abs(start - h_4) <7 ) output;
   when (abs(start - h_5) <7 ) output;
   when (abs(start - h_6) <7 ) output;
   when (abs(start - h_7) <7 ) output;
   when (abs(start - h_8) <7 ) output;
   when (abs(start - h_9) <7 ) output;
   when (abs(start - h_10) <7 ) output;
   when (abs(start - h_11) <7 ) output;
   when (abs(start - h_12) <7 ) output;
   when (abs(start - h_13) <7 ) output;
   when (abs(start - h_14) <7 ) output;

   when (abs(start - h_15) <7 ) output;
   when (abs(start - h_16) <7 ) output;
   when (abs(start - h_17) <7 ) output;
   when (abs(start - h_18) <7 ) output;
   when (abs(start - h_19) <7 ) output;
   when (abs(start - h_20) <7 ) output;
   when (abs(start - h_21) <7 ) output;
   when (abs(start - h_22) <7 ) output;
   when (abs(start - h_23) <7 ) output;
   when (abs(start - h_24) <7 ) output;
   when (abs(start - h_25) <7 ) output;
   when (abs(start - h_26) <7 ) output;
   when (abs(start - h_27) <7 ) output;
   when (abs(start - h_28) <7 ) output;

   when (abs(start - h_29) <7 ) output;
   when (abs(start - h_30) <7 ) output;
   when (abs(start - h_31) <7 ) output;
   when (abs(start - h_32) <7 ) output;
   when (abs(start - h_33) <7 ) output;
   when (abs(start - h_34) <7 ) output;
   when (abs(start - h_35) <7 ) output;
   when (abs(start - h_36) <7 ) output;
   when (abs(start - h_37) <7 ) output;
   when (abs(start - h_38) <7 ) output;
   when (abs(start - h_39) <7 ) output;
   when (abs(start - h_40) <7 ) output;
  
   otherwise delete;
   end;

   keep start end ret ret1;  
run;

%mend;
%holiday(hs_a);%holiday(hs_b);%holiday(hs_c);%holiday(hs_d);%holiday(hs_e);

1.4剔除节前节后的组合另存为新的数据
%macro noholiday(dataset1=,dataset2=);
proc sql noprint;
   create table noholiday_&dataset1 as
   select *
      from &dataset1
      where start not in
         (select start from &dataset2);
quit;
%mend;
%noholiday(dataset1=hs_a,dataset2=holiday_hs_a);
%noholiday(dataset1=hs_b,dataset2=holiday_hs_b);
%noholiday(dataset1=hs_c,dataset2=holiday_hs_c);
%noholiday(dataset1=hs_d,dataset2=holiday_hs_d);
%noholiday(dataset1=hs_e,dataset2=holiday_hs_e);

1.5将周一、周二、周三、周四、周五的数据合并为一张表,下面是对节假日数据的合并 

 ,noholiday(去节假日数据)hs_abcd(完整的数据)合并方法类似。
data holiday;*holiday系所有节前节后数据;
   set holiday_hs_a(in=a)
       holiday_hs_b(in=b)
       holiday_hs_c(in=c)
       holiday_hs_d(in=d)
       holiday_hs_e(in=e)
   ;
   if a=1 then group='周一';
   if b=1 then group='周二';
   if c=1 then group='周三';
   if d=1 then group='周四';
   if e=1 then group='周五';
run;

2.进行收益的描述性统计计算。
2.1proc means计算出常规统计,下面统计了节假日前后一周开仓的组合收益情况,其他 

 情况可以将holiday替换。
proc means data=holiday sum mean std max min;
   by group notsorted;
   var ret;
   class flag; 
   output out=holiday1;
run;

2.2统计组合收益分布比例情况
data test;
   set holiday;
   by end notsorted;
   if first.end then  cnt=1;
   else  cnt+1;
run;
proc format;
   value ret
            low - -0.05   =  '< -5%     '
            -0.05 - -0.02 =  '-5% ~ -2%'
     -0.02 - 0     =  '-2% ~ 0% '
     0 - 0.02      =  ' 0% ~ 2% '
     0.02 - 0.05   =  ' 2% ~5%  '
     0.05 - 0.10   =  ' 5% ~10% '
     other= ' >10% '
;
proc freq data=test;
   tables cnt*ret  ;
   format ret ret.;  
   ods output   CrossTabFreqs=need;

run;

你可能感兴趣的:(Date,Excel,import,dataset,output,2010)