% Conference paper in the IHI'10 proceedings (1st ACM International Health
% Informatics Symposium). The citation key is the exporter-generated
% identifier and is kept unchanged so existing \cite commands still resolve.
% The proceedings title lives only in `booktitle`; it is not a book series.
@inproceedings{57bc9054d67040ff9fc379ebab8dab50,
  author    = {Torii, Manabu and Bayarsaikhan, Burt Ujin and Liu, Hongfang and Nguyen, Thang and Jones, Kevin and Nelson, Noele P. G. and Hartley, David M.},
  title     = {An exploratory study of news article clustering for web-based bio-surveillance},
  booktitle = {{IHI}'10 - Proceedings of the 1st {ACM} International Health Informatics Symposium},
  pages     = {435--439},
  year      = {2010},
  doi       = {10.1145/1882992.1883058},
  isbn      = {9781450300308},
  language  = {English (US)},
  keywords  = {biosurveillance, clustering, feature selection, text mining},
  abstract  = {Online news articles provide rich and timely information for disease outbreak surveillance. Meanwhile, it is not trivial to search articles relevant to disease outbreaks among the large volume of online publications. In this study, we examined the use of text clustering techniques to organize online articles. To take into account surveillance analysts' expertise in clustering articles, we considered selection of informative word features in a supervised manner. Our experiments suggest that the supervised selection of features can significantly reduce the features size without affecting the utility of resulting clusters. In addition, we observed that the clustering algorithm could yield consistent results when a small number of selected features were used.},
  note      = {1st {ACM} International Health Informatics Symposium, {IHI}'10; conference dates: 11--12 November 2010},
}