% Workshop paper in the CLSW 2012 revised selected papers (see booktitle/note).
% Braces inside the title protect the proper noun from style-driven down-casing.
@inproceedings{a7654c9921e74e81bbcba31d958e3b6d,
  author    = {Xu, Ge and Huang, Chu-ren and Wang, Houfeng},
  title     = {Extracting {Chinese} product features: Representing a sequence by a set of skip-bigrams},
  booktitle = {Chinese Lexical Semantics - 13th Workshop, CLSW 2012, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  pages     = {72--83},
  year      = {2013},
  month     = feb,
  day       = {26},
  doi       = {10.1007/978-3-642-36337-5_9},
  isbn      = {9783642363368},
  language  = {English},
  keywords  = {product feature, sentiment analysis, skip-bigram, word sequence},
  abstract  = {A skip-bigram is a bigram that allows skips between words. In this paper, we use a set of skip bigrams (a SBGSet) to represent a short word sequence, which is the typical form of a product feature. The advantage of SBGSet representation for word sequences is that we can convert between a sequence and a set. Under the SBGSet representation we can employ association rule mining to find frequent itemsets from which frequent product features can be extracted. For infrequent product features, we use a pattern-based method to extract them. A pattern is also represented by a SBGSet, and contains a variable that can be instantiated to a product feature. We use two data sets to evaluate our method. The experimental result shows that our method is suitable for extracting Chinese product features, and the pattern-based method to extract infrequent product features is effective.},
  note      = {13th Chinese Lexical Semantics Workshop, CLSW 2012 ; Conference date: 06-07-2012 Through 08-07-2012},
}