% Hard-coded table-of-contents entries, typeset at \small size.
% Each entry has the form
%   \contentsline{<level>}{\numberline{<number>}<title>}{<page>}
% Subsection entries are indented under their parent section for readability
% only; leading whitespace on a line is ignored by TeX.
% NOTE(review): the \endgroup that closes this group is not in this span --
% presumably it follows later in the file; confirm.
% NOTE(review): the titles of 3.4 ("Tf*IDF") and 4.3 ("Tf*Idf") are
% capitalised differently. If that is unintended, fix it in the corresponding
% sectioning commands as well, so the headings and these entries stay in sync.
\begingroup
\small
%
% --- 1 ---
\contentsline{section}{\numberline{1}Introduction: We don't need another hero}{3}
%
% --- 2 ---
\contentsline{section}{\numberline{2}Concept of Operations}{4}
%
% --- 3 ---
\contentsline{section}{\numberline{3}How it Works}{6}
  \contentsline{subsection}{\numberline{3.1}Tokenization}{6}
  \contentsline{subsection}{\numberline{3.2}Stop lists}{6}
  \contentsline{subsection}{\numberline{3.3}Stemming}{6}
  \contentsline{subsection}{\numberline{3.4}Tf*IDF}{7}
  \contentsline{subsection}{\numberline{3.5}InfoGain}{7}
%
% --- 4 ---
\contentsline{section}{\numberline{4}Results}{8}
  \contentsline{subsection}{\numberline{4.1}Data}{8}
  \contentsline{subsection}{\numberline{4.2}Stopping and Stemming}{8}
  \contentsline{subsection}{\numberline{4.3}Tf*Idf}{8}
  \contentsline{subsection}{\numberline{4.4}Learning}{9}
%
% --- 5 ---
\contentsline{section}{\numberline{5}Discussion}{11}