BEGIN { IGNORECASE = 1; # Ignore case in string comparisons. FS = ","; # Initialize the field separator. OFS = ","; # Initialize the output field separator. Pred = 30; # Initialize the range for Pred. } { EstimatedEffort = $1; ActualEffort = $2; Re = (EstimatedEffort-ActualEffort)/ActualEffort Mre = Re < 0 ? -1* Re : Re; SumMre += Mre; SumMreSq += Mre^2; if (Mre < (Pred/100)) PredN++ Corr_Se+=((EstimatedEffort-AvgEstimate)*(EstimatedEffort-AvgEstimate)); Corr_Sa+=((ActualEffort-AvgActual)*(ActualEffort-AvgActual)); Corr_Sea+=((EstimatedEffort-AvgEstimate)*(ActualEffort-AvgActual)); } END { Mmre = 100*SumMre/NR; Pred30 = 100*PredN/NR; SdMmre = 100*sd(SumMreSq,SumMre,NR); Corr_Se=Corr_Se/(NR-1); Corr_Sa=Corr_Sa/(NR-1); Corr_Sea=Corr_Sea/(NR-1); Corr=(Corr_Sea/sqrt(Corr_Se*Corr_Sa)); # tim wants the sd on pred30. will i have to run this 30 times and do the stdev of the output of pred30? # won't i have to concatenate the results of the 30 runs and use this to find the mmre and SdMmre? # 'mean' pred30 could be found either way #print "MMRE, SD(MRE), PRED30, CORR" print Mmre, SdMmre, Pred30, Corr; #print Mmre, SdMmre, Pred30 } function sd(sumSq,sumX,n) { return sqrt((sumSq-((sumX*sumX) / n)) / (n-1)) }