% Conference paper from AIRS 2019 (Springer LNCS). Event name/dates and the
% copyright line are stored in dedicated fields instead of free-text `note`.
@inproceedings{188fdf1079c349c1967670c2e9644d3d,
  author     = {Zeng, Zequan and Cai, Yi and Wang, Fu Lee and Xie, Haoran and Chen, Junying},
  title      = {Weighted N-grams {CNN} for Text Classification},
  booktitle  = {Information Retrieval Technology -- 15th Asia Information Retrieval Societies Conference, {AIRS} 2019, Proceedings},
  editor     = {Wang, Fu Lee and Xie, Haoran and Lam, Wai and Sun, Aixin and Ku, Lun-Wei and Hao, Tianyong and Chen, Wei and Wong, Tak-Lam and Tao, Xiaohui},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer},
  year       = {2020},
  pages      = {158--169},
  doi        = {10.1007/978-3-030-42835-8_14},
  isbn       = {9783030428341},
  language   = {English},
  keywords   = {CNN model, Text classification, Weighted n-grams features},
  abstract   = {Text categorization can solve the problem of information clutter to a large extent, and it also provides a more efficient search strategy and more effective search results for information retrieval. In recent years, Convolutional Neural Networks have been widely applied to this task. However, most existing CNN models are difficult to extract longer n-grams features for the reason as follow: the parameters of the standard CNN model will increase with the increase of the length of n-grams features because it extracts n-grams features through convolution filters of fixed window size. Meanwhile, the term weighting schemes assigning reasonable weight values to words have exhibited excellent performance in traditional bag-of-words models. Intuitively, considering the weight value of each word in n-grams features may be beneficial in text classification. In this paper, we proposed a model called weighted n-grams CNN model. It is a variant of CNN introducing a weighted n-grams layer. The parameters of the weighted n-grams layer are initialized by term weighting schemes. Only by adding fixed parameters can the model generate any length of weighted n-grams features. We compare our proposed model with other popular and latest CNN models on five datasets in text classification. The experimental results show that our proposed model exhibits comparable or even superior performance.},
  eventtitle = {15th Asia Information Retrieval Societies Conference, {AIRS} 2019},
  eventdate  = {2019-11-07/2019-11-09},
  copyright  = {{\textcopyright} Springer Nature Switzerland AG 2020},
}