# Reads "@attribute" / "@data" style input and hands every data row to
# store(); the END rule then works on the collected per-class information.
#
# assumes data has been pruned already
# and we know min max
#
# Example driver (shell), kept from the original notes:
#   Tmp=`mktemp -d`
#   trap "rm -rf $Tmp" 0 1 2 3 15
#   gawk -f prune.awk $1 > $Tmp/pruned
#   (gawk -f maxmin.awk $Tmp/pruned ; cat $Tmp/pruned) | gawk -f discrete.awk

# Global settings.
#   Klass      - class column; a negative value is resolved relative to the
#                number of attributes when "@data" is seen (-1 => last one).
#   IGNORECASE - gawk-only: makes the regex matches below case-insensitive.
#   DontKnow, Lots - not used in the visible part of this file; presumably
#                consumed by helpers defined elsewhere (TODO confirm).
#   CONVFMT    - format used when numbers are converted to strings.
BEGIN { Klass=-1; IGNORECASE =1; DontKnow = "?"; Lots = 10^10; CONVFMT = "%.10g" }

# Runs on every record: first deletes each "space followed by tab" pair,
# then deletes everything from the first "%" to the end of the record.
# NOTE(review): / \t/ matches only a space immediately followed by a tab;
# it may have been meant as /[ \t]/, but the "@attribute" rule below relies
# on whitespace-separated $2/$3 -- confirm intent before changing.
{ gsub(/ \t/,"",$0) ; gsub(/%.*/,"")}

# Skip records that are empty after the clean-up above.
/^$/ { next }

# Attribute declaration: append the attribute name ($2) to Name, using
# Name[0] as the running count, and flag the attribute in Nump when its
# declared type ($3) matches one of the numeric type words.
/@attribute/ { Name[++Name[0]] = $2
               if ( $3 ~ /real|integer|numeric|continuous/ ) Nump[Name[0]]=1 }

# Start of the data section: set the In flag, switch input and output field
# separators to "," and turn a negative Klass into an absolute column index
# (Name[0] + 1 + Klass).
/@data/ { In=1; FS=OFS=","; Klass= Klass < 0 ? Name[0] + 1 + Klass : Klass; }

# Any record containing "@" (including the two kinds handled above) stops
# here, so it never reaches the data rule below.
/@/ { next}

# Data row: pass the row's class value and the bookkeeping arrays to store()
# (defined outside the visible part of this file).
In { store(Klasses,$Klass,Data,Nump,N,Sum,Mean,Name[0]) }

# After all input: call classPdf() and saya() (both defined elsewhere), then
# loop with index I.
# NOTE(review): the rest of this rule is cut off in the visible source.
END { classPdf(Klasses,Pdf)
      saya("pdf",Pdf)
      for(I=1;I