\relax \citation{Hart68a} \citation{Frank+Asuncion:2010} \citation{Hart67} \citation{Bezdek2000,Bezdek2001,Kim2003} \@writefile{toc}{\contentsline {chapter}{\numberline {1}Introduction}{1}} \@writefile{lof}{\addvspace {10\p@ }} \@writefile{lot}{\addvspace {10\p@ }} \newlabel{introduction}{{1}{1}} \citation{jalali08} \citation{Frank+Asuncion:2010} \citation{fastmap} \citation{01cod} \citation{01cod} \@writefile{toc}{\contentsline {section}{\numberline {1.1}Statement of Thesis}{4}} \@writefile{toc}{\contentsline {section}{\numberline {1.2}Contributions of this Thesis}{4}} \@writefile{toc}{\contentsline {section}{\numberline {1.3}Structure of this Thesis}{4}} \citation{Devi2002,Bezdek2001,Chang74,Dasarathy94,Li2009,Bezdek98,Cano2005,Garain2008,Veenman2005,García2008,Kohonen98,Kohonen90} \citation{Hart68a} \citation{Change74} \@writefile{toc}{\contentsline {chapter}{\numberline {2}Background and Related Work}{5}} \@writefile{lof}{\addvspace {10\p@ }} \@writefile{lot}{\addvspace {10\p@ }} \newlabel{related}{{2}{5}} \@writefile{toc}{\contentsline {section}{\numberline {2.1}Prototype Learning for Nearest Neighbor Classifiers}{5}} \citation{Dasarathy94} \@writefile{toc}{\contentsline {subsection}{\numberline {2.1.1}Instance Selection}{6}} \@writefile{toc}{\contentsline {subsubsection}{Condensed Nearest Neighbor (CNN)}{6}} \@writefile{toc}{\contentsline {subsubsection}{Reduced Nearest Neighbor (RNN)}{6}} \@writefile{toc}{\contentsline {subsubsection}{Minimal Consistent Set (MCS)}{6}} \@writefile{toc}{\contentsline {subsection}{\numberline {2.1.2}Instance Abstraction}{6}} \@writefile{toc}{\contentsline {subsubsection}{Chang}{6}} \@writefile{lof}{\contentsline {figure}{\numberline {2.1}{\ignorespaces Chang's algorithm for finding prototypes}}{7}} \newlabel{fig:chang}{{2.1}{7}} \@writefile{toc}{\contentsline {chapter}{\numberline {3}CLIFF: Tool for Instance Selection}{8}} \@writefile{lof}{\addvspace {10\p@ }} \@writefile{lot}{\addvspace {10\p@ }} \newlabel{cliff}{{3}{8}} \@writefile{toc}{\contentsline {section}{\numberline {3.1}CLIFF: Tool for Instance Selection}{8}} \newlabel{subsection:selector}{{3.1}{8}} \newlabel{eq:one}{{3.1}{9}} \@writefile{lof}{\contentsline {figure}{\numberline {3.1}{\ignorespaces A log of some golf-playing behavior}}{9}} \newlabel{fig:golf}{{3.1}{9}} \@writefile{lof}{\contentsline {figure}{\numberline {3.2}{\ignorespaces Pseudo code for Support Based Bayesian Ranking algorithm}}{10}} \newlabel{fig:sbbra}{{3.2}{10}} \citation{Frank+Asuncion:2010} \citation{fastmap} \@writefile{toc}{\contentsline {chapter}{\numberline {4}CLIFF Assessment}{11}} \@writefile{lof}{\addvspace {10\p@ }} \@writefile{lot}{\addvspace {10\p@ }} \newlabel{assess}{{4}{11}} \@writefile{toc}{\contentsline {section}{\numberline {4.1}Data and Preprocessing Tools}{11}} \@writefile{toc}{\contentsline {subsection}{\numberline {4.1.1}Data Set Characteristics}{11}} \@writefile{lof}{\contentsline {figure}{\numberline {4.1}{\ignorespaces Data Set Characteristics}}{12}} \newlabel{fig:info}{{4.1}{12}} \@writefile{toc}{\contentsline {subsection}{\numberline {4.1.2}Pre-processing tools for Dimensionality Reduction}{12}} \@writefile{toc}{\contentsline {subsubsection}{FastMap}{12}} \@writefile{lof}{\contentsline {figure}{\numberline {4.2}{\ignorespaces Data Set Characteristics}}{13}} \newlabel{fig:work}{{4.2}{13}} \@writefile{toc}{\contentsline {subsubsection}{Feature Subset Selection (FSS)}{13}} \@writefile{lof}{\contentsline {figure}{\numberline {4.3}{\ignorespaces Choosing the best number of features for each data set. The best choice will have a high pd along with a low pf}}{14}} \newlabel{fig:numf}{{4.3}{14}} \@writefile{lof}{\contentsline {figure}{\numberline {4.4}{\ignorespaces Example of using the cosine law to find the position of $Oi$ in the dimension $k$}}{14}} \newlabel{fig:fm1}{{4.4}{14}} \@writefile{lof}{\contentsline {figure}{\numberline {4.5}{\ignorespaces Projects of points $O_i$ and $O_j$ onto the hyper-plane perpendicular to the line $O_a$$O_b$}}{15}} \newlabel{fig:fm2}{{4.5}{15}} \@writefile{toc}{\contentsline {section}{\numberline {4.2}CLIFF Assessment on Standard Data Sets}{15}} \@writefile{toc}{\contentsline {subsection}{\numberline {4.2.1}Experimental Method}{15}} \newlabel{section:brit}{{4.2.1}{15}} \@writefile{toc}{\contentsline {subsection}{\numberline {4.2.2}Is CLIFF viable as a Prototype Learner for NNC?}{16}} \@writefile{lof}{\contentsline {figure}{\numberline {4.6}{\ignorespaces Pseudo code for Experiment}}{16}} \newlabel{fig:knnexp1}{{4.6}{16}} \@writefile{toc}{\contentsline {subsubsection}{Results from Experiment}{17}} \newlabel{fig:result1}{{4.2.2}{17}} \@writefile{lof}{\contentsline {figure}{\numberline {4.7}{\ignorespaces Probability of Detection (PD) and Probability of False Alarm (PF)results}}{17}} \newlabel{fig:results100}{{4.7}{17}} \@writefile{lof}{\contentsline {figure}{\numberline {4.8}{\ignorespaces Summary of Mann Whitney U test results (95\% confidence): moving from Befroe to After.}}{18}} \newlabel{fig:man1}{{4.8}{18}} \@writefile{lof}{\contentsline {figure}{\numberline {4.9}{\ignorespaces Position of values in the 'before' and 'after' population with data set at 3, 5, 10 and 20 clusters. The first row shows the results for r=1 while the second row shows the results for r=2}}{19}} \newlabel{fig:charts1}{{4.9}{19}} \citation{Walsh94} \@writefile{toc}{\contentsline {chapter}{\numberline {5}Case Study: Solving the Problem of Brittleness in Forensic Models}{20}} \@writefile{lof}{\addvspace {10\p@ }} \@writefile{lot}{\addvspace {10\p@ }} \newlabel{forensics}{{5}{20}} \@writefile{toc}{\contentsline {section}{\numberline {5.1}Introduction}{20}} \citation{09NAS} \citation{09NAS} \citation{Seheult78} \citation{Grove80} \@writefile{toc}{\contentsline {section}{\numberline {5.2}Visualization of Brittleness}{22}} \@writefile{toc}{\contentsline {section}{\numberline {5.3}Glass Forensic Models}{22}} \citation{Evett94} \citation{Walsh94} \citation{Seheult78} \citation{77Lindley} \@writefile{toc}{\contentsline {subsection}{\numberline {5.3.1}Seheult 1978}{23}} \newlabel{subsection:seh}{{5.3.1}{23}} \newlabel{eq:lin1}{{5.1}{23}} \newlabel{eq:lin2}{{5.2}{23}} \citation{Evett94} \@writefile{toc}{\contentsline {subsection}{\numberline {5.3.2}Grove 1980}{24}} \newlabel{subsection:gro}{{5.3.2}{24}} \newlabel{eq:gro2}{{5.3}{24}} \newlabel{eq:gro4}{{5.5}{24}} \@writefile{toc}{\contentsline {subsection}{\numberline {5.3.3}Evett 1995}{25}} \newlabel{subsection:eve}{{5.3.3}{25}} \citation{Walsh94} \@writefile{toc}{\contentsline {subsection}{\numberline {5.3.4}Walsh 1996}{26}} \newlabel{subsection:wal}{{5.3.4}{26}} \@writefile{toc}{\contentsline {section}{\numberline {5.4}Visualization of Brittleness in Models}{27}} \@writefile{lof}{\contentsline {figure}{\numberline {5.1}{\ignorespaces Visualization of four(4) glass forensic models}}{28}} \newlabel{fig:models}{{5.1}{28}} \citation{09NAS} \citation{Seheult78,Evett84,Evett90,Evett94,Walsh94} \citation{Seheult78,Grove80,Walsh94} \citation{Karslake09} \citation{Karslake09} \citation{Karslake09} \@writefile{toc}{\contentsline {section}{\numberline {5.5}Introduction}{29}} \citation{Karslake09} \citation{joll02} \@writefile{lof}{\contentsline {figure}{\numberline {5.2}{\ignorespaces Proposed procedure for the forensic evaluation of data}}{31}} \newlabel{fig:process}{{5.2}{31}} \@writefile{toc}{\contentsline {section}{\numberline {5.6}Dimensionality Reduction}{31}} \@writefile{toc}{\contentsline {subsection}{\numberline {5.6.1}Principal Component Analysis}{31}} \@writefile{lof}{\contentsline {figure}{\numberline {5.3}{\ignorespaces PCA for iris data set}}{32}} \newlabel{fig:iris}{{5.3}{32}} \citation{Karslake09} \citation{pca} \citation{Karslake09} \citation{fastmap} \citation{knn} \@writefile{toc}{\contentsline {section}{\numberline {5.7}Clustering}{34}} \@writefile{toc}{\contentsline {section}{\numberline {5.8}Classification with KNN}{34}} \newlabel{subsection:knn}{{5.8}{34}} \@writefile{lof}{\contentsline {figure}{\numberline {5.4}{\ignorespaces Probability of detection (pd) and Probability of False alarms (pf) using fixed values for dimensions and fixed k values for k-nearest neighbor}}{35}} \newlabel{fig:exp1}{{5.4}{35}} \@writefile{lof}{\contentsline {figure}{\numberline {5.5}{\ignorespaces Pseudo code for K-means}}{36}} \newlabel{fig:kmeans}{{5.5}{36}} \@writefile{toc}{\contentsline {section}{\numberline {5.9}The Brittleness Measure}{36}} \newlabel{subsection:bm}{{5.9}{36}} \citation{Karslake09} \citation{Karslake09} \citation{Karslake09} \newlabel{eq:bm}{{5.9}{37}} \@writefile{toc}{\contentsline {section}{\numberline {5.10}Data Set and Experimental Method}{37}} \newlabel{section:brit}{{5.10}{37}} \@writefile{toc}{\contentsline {section}{\numberline {5.11}Experiment 1: KNN as a forensic model?}{38}} \@writefile{toc}{\contentsline {subsection}{\numberline {5.11.1}Results from Experiment 1}{38}} \@writefile{lof}{\contentsline {figure}{\numberline {5.6}{\ignorespaces Pseudo code for Experiment 1}}{39}} \newlabel{fig:knnexp1}{{5.6}{39}} \@writefile{toc}{\contentsline {section}{\numberline {5.12}Experiment 2: Can brittleness be reduced?}{39}} \@writefile{lof}{\contentsline {figure}{\numberline {5.7}{\ignorespaces Results for Experiment 1 for the 4 data sets distinguished by the number of clusters. Here for the upper and lower tables n=4 is used while r=1 is used for the upper table and r=2 for the lower table.}}{40}} \newlabel{fig:result1}{{5.7}{40}} \@writefile{lof}{\contentsline {figure}{\numberline {5.8}{\ignorespaces Pseudo code for Experiment 2}}{41}} \newlabel{fig:knnexp2}{{5.8}{41}} \@writefile{toc}{\contentsline {subsection}{\numberline {5.12.1}Results from Experiment 2}{41}} \citation{09Zadora,09aZadora,06Aitken,04Aitken,02Koons,99Koons} \@writefile{lof}{\contentsline {figure}{\numberline {5.9}{\ignorespaces Results for Experiment 2 for the 4 data sets distinguished by the number of clusters. Here for the upper and lower tables n=4 is used while r=1 is used for the upper table and r=2 for the lower table.}}{43}} \newlabel{fig:result2}{{5.9}{43}} \@writefile{lof}{\contentsline {figure}{\numberline {5.10}{\ignorespaces Position of values in the 'before' and 'after' population with data set at 3, 5, 10 and 20 clusters. The first row shows the results for r=1 while the second row shows the results for r=2}}{44}} \newlabel{fig:dist3}{{5.10}{44}} \@writefile{lof}{\contentsline {figure}{\numberline {5.11}{\ignorespaces Results for Experiment 2 of before and after results. -1 indicates that the after is better than before}}{44}} \newlabel{fig:result3}{{5.11}{44}} \citation{09NAS} \citation{09NAS} \citation{Karslake09} \@writefile{toc}{\contentsline {chapter}{\numberline {6}Conclusion}{45}} \@writefile{lof}{\addvspace {10\p@ }} \@writefile{lot}{\addvspace {10\p@ }} \newlabel{conclusion}{{6}{45}} \bibstyle{plain} \bibdata{thesis-v2} \bibcite{04Aitken}{1} \bibcite{06Aitken}{2} \bibcite{Bezdek2000}{3} \bibcite{Bezdek2001}{4} \bibcite{pca}{5} \bibcite{Cano2005}{6} \bibcite{Chang74}{7} \bibcite{Hart67}{8} \bibcite{Dasarathy94}{9} \bibcite{Devi2002}{10} \bibcite{knn}{11} \bibcite{Evett84}{12} \bibcite{Evett90}{13} \bibcite{Evett94}{14} \bibcite{fastmap}{15} \bibcite{Frank+Asuncion:2010}{16} \bibcite{Garain2008}{17} \bibcite{García2008}{18} \bibcite{Grove80}{19} \bibcite{Hart68a}{20} \bibcite{jalali08}{21} \bibcite{joll02}{22} \bibcite{Karslake09}{23} \bibcite{Kim2003}{24} \bibcite{Kohonen90}{25} \bibcite{Kohonen98}{26} \bibcite{02Koons}{27} \bibcite{99Koons}{28} \bibcite{01cod}{29} \bibcite{Li2009}{30} \bibcite{77Lindley}{31} \bibcite{09NAS}{32} \bibcite{Seheult78}{33} \bibcite{Veenman2005}{34} \bibcite{Walsh94}{35} \bibcite{09aZadora}{36} \bibcite{09Zadora}{37}