% Conference paper in the ACL-IJCNLP 2009 proceedings (pages 692--700).
% Maintenance notes:
%   * The proceedings name is stored only in booktitle; it is not a book
%     series, so no series field is given.
%   * Event name and dates are stored in eventtitle/eventdate and the
%     publisher copyright line in copyright, rather than in a printed note.
%     Styles that do not know these fields ignore them.
%   * NOTE(review): address was a country-only value ("United States") in the
%     export; it has been refined to the publisher location -- please confirm.
@inproceedings{f47f8b60baa04c2daca57bf435f74072,
  author     = {Li, Shoushan and Xia, Rui and Zong, Chengqing and Huang, Chu Ren},
  title      = {A Framework of Feature Selection Methods for Text Categorization},
  booktitle  = {{ACL-IJCNLP} 2009 -- Joint Conference of the 47th Annual Meeting of the Association for Computational Linguistics and 4th International Joint Conference on Natural Language Processing of the {AFNLP}, Proceedings of the Conference},
  editor     = {Su, Keh-Yih and Su, Jian and Wiebe, Janyce and Li, Haizhou},
  pages      = {692--700},
  publisher  = {Association for Computational Linguistics (ACL)},
  address    = {Stroudsburg, PA, USA},
  year       = {2009},
  month      = aug,
  eventtitle = {Joint Conference of the 47th Annual Meeting of the Association for Computational Linguistics and 4th International Joint Conference on Natural Language Processing of the {AFNLP}, {ACL-IJCNLP} 2009},
  eventdate  = {2009-08-02/2009-08-07},
  isbn       = {9781617382581},
  language   = {English},
  copyright  = {{\textcopyright} 2009 ACL and AFNLP},
  abstract   = {In text categorization, feature selection (FS) is a strategy that aims at making text classifiers more efficient and accurate. However, when dealing with a new task, it is still difficult to quickly select a suitable one from various FS methods provided by many previous studies. In this paper, we propose a theoretic framework of FS methods based on two basic measurements: frequency measurement and ratio measurement. Then six popular FS methods are in detail discussed under this framework. Moreover, with the guidance of our theoretical analysis, we propose a novel method called weighed frequency and odds (WFO) that combines the two measurements with trained weights. The experimental results on data sets from both topic-based and sentiment classification tasks show that this new method is robust across different tasks and numbers of selected features.},
}