(defun datasetStuff ()
  "Print a summary row for every enabled dataset, then the dataset count.

Each enabled dataset function below is called once; the resulting tables
are sorted with the predicate LT on TABLE-NAME.  One row per table is
handed to ALIGN (presumably a column-aligning printer -- confirm against
its definition).  A row holds, in order:
  1. (table-name table)
  2. (counted-n (table-all table))
  3. HEADER-NUMERICP of the column header at index (table-class table)
  4. MY-FROUND of the fraction of column headers satisfying HEADER-NUMERICP
  5. (counted-n (table-columns table))
  6. the number of entries in (xindex-class-counts (cross-index table))
Finally `N datasets' is written to standard output.  The return value is
that of the closing FORMAT call (NIL)."
  (flet ((summary-row (table)
           ;; Fetch the column container and its header list once.
           ;; Assumes TABLE-COLUMNS, COUNTED-ALL and COUNTED-N are
           ;; side-effect-free accessors -- TODO confirm.
           (let* ((columns (table-columns table))
                  (headers (counted-all columns))
                  (n-columns (counted-n columns)))
             (list (table-name table)
                   (counted-n (table-all table))
                   (header-numericp (nth (table-class table) headers))
                   ;; Numeric headers counted as 1/0 and summed, then
                   ;; divided by the column count.
                   (my-fround (/ (sum (mapcar #'(lambda (header)
                                                  (if (header-numericp header) 1 0))
                                              headers))
                                 n-columns))
                   n-columns
                   (hash-table-count
                    (xindex-class-counts (cross-index table)))))))
    ;; LIST (rather than a backquote template) guarantees a freshly consed
    ;; list, which is what the destructive SORT below requires.
    ;; NOTE(review): entries were reconstructed as one per line; an entry
    ;; prefixed with `;;' is disabled -- confirm against the project's
    ;; intended dataset selection.
    (let ((datasets
            (list
             ;; (weather)
             ;; (contact-lens)
             (breast-cancer)
             (breastTumor)
             (primary-tumor)
             (meta)
             (soybean)
             ;; (titanic)
             (anneal)                     ; works
             (audiology)
             (auto93)                     ; works
             (autoHorse)                  ; works
             (autoMpg)                    ; works
             (autoPrice)                  ; works
             (autos)                      ; works
             (basketball)                 ; works
             (bodyfat)                    ; works
             (bolts)                      ; works
             (boston-housing)             ; works
             (cholesterol)                ; works
             (cleveland-14-heart-disease) ; works
             (cleveland)                  ; works
             (cloud)                      ; works
             (cpu)                        ; works
             (credit-rating)              ; works
             (detroit)                    ; works
             (echoMonths)                 ; works
             (elusage)                    ; works
             (fishcatch)                  ; works
             (fruitfly)                   ; works
             (gascons)                    ; works
             (horse-colic)                ; works
             (housing)                    ; works
             (hungarian-14-heart-disease) ; works
             (hungarian)                  ; works
             ;; (hypothyroid) -- breaks due to last row being all ?
             (ionosphere)                 ; works
             (kr-vs-kp)                   ; works
             ;; (letter) -- causes process to die
             (lowbwt)                     ; works
             (mammal-sleep)               ; works
             (mbagrade)                   ; works
             (mushroom)                   ; works
             (pbc)                        ; works
             (pharynx)                    ; works
             ;; (pima_diabetes) -- breaking
             (pollution)                  ; works
             (pwLinear)                   ; works
             (quake)                      ; works
             (schlvote)                   ; works now with the check of an unknown class
             ;; (segment) -- breaks due to ewd on the 3rd column resulting
             ;;              in a divide by zero
             (sensory)                    ; works
             (servo)                      ; works
             ;; (sick) -- breaks due to the 3rd last column not containing
             ;;           any data to discretize on
             (sonar)                      ; works
             ;; (splice) -- causes process to die
             (strike)                     ; works
             (vehicle)                    ; works
             (veteran)                    ; works
             (vineyard)                   ; works
             ;; (vote) -- error in data set caused a break
             (vowel)                      ; works
             ;; (waveform) -- causes process to die
             ;; (weather.nominal) -- works
             )))
      ;; NOTE(review): the original comment here read "Adds the Crush data
      ;; sets to be run", but no code in this function adds such datasets;
      ;; the statement below only sorts the list by table name.
      (setf datasets (sort datasets 'lt :key #'table-name))
      (align (mapcar #'summary-row datasets))
      (format t "~A datasets~%" (length datasets)))))