@conference {15902, title = {Improving text classification for oral history archives with temporal domain knowledge}, booktitle = {Proceedings of the 30th annual international ACM SIGIR conference on Research and development in information retrieval}, series = {SIGIR {\textquoteright}07}, year = {2007}, month = {2007///}, pages = {623 - 630}, publisher = {ACM}, organization = {ACM}, address = {New York, NY, USA}, abstract = {This paper describes two new techniques for increasing the accuracy oftopic label assignment to conversational speech from oral history interviews using supervised machine learning in conjunction with automatic speech recognition. The first, time-shifted classification, leverages local sequence information from the order in which the story is told. The second, temporal label weighting, takes the complementary perspective by using the position within an interview to bias label assignment probabilities. These methods, when used in combination, yield between 6\% and 15\% relative improvements in classification accuracy using a clipped R-precision measure that models the utility of label sets as segment summaries in interactive speech retrieval applications.}, keywords = {automatic topic classification, classifying with domain knowledge, spoken document classification}, isbn = {978-1-59593-597-7}, doi = {10.1145/1277741.1277848}, url = {http://doi.acm.org/10.1145/1277741.1277848}, author = {Olsson,J. Scott and Oard, Douglas} }