% Conference paper on CRF-based part-of-speech tagging of Classical Chinese,
% published in the CLSW 2015 proceedings (Lecture Notes in Computer Science).
% The export's "month = jan, day = 1" placeholder was dropped: the workshop
% took place in May 2015, so the revised papers cannot date from 1 January.
% NOTE(review): address holds a country, not the publisher's city -- confirm
%   the city against the publisher record before relying on it.
% NOTE(review): the series volume number is not recorded here -- add a
%   volume field once verified.
@inproceedings{c4c9fc2266ac4ca69d1e95ba1d812aa4,
  author    = {Chiu, {Tin Shing} and Lu, Qin and Xu, Jian and Xiong, Dan and Lo, Fengju},
  title     = {{PoS} Tagging for {Classical} {Chinese} Text},
  booktitle = {Chinese Lexical Semantics -- 16th Workshop, {CLSW} 2015, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Verlag},
  address   = {Germany},
  year      = {2015},
  pages     = {448--456},
  doi       = {10.1007/978-3-319-27194-1_44},
  isbn      = {9783319271934},
  language  = {English},
  keywords  = {Ancient Chinese, Chinese classics, Novels in the Ming and Qing dynasties, Part-of-speech tagging},
  abstract  = {The Chinese language is evolving over the centuries. In order to study the changes of Chinese language using computational methods, segmentation and PoS tagging of Chinese are essential. However, segmentation and PoS tagging methods developed for Modern Standard Chinese do not perform well for Classical Chinese. The cost of segmenting and annotation is high if they are done manually. In this work, we present a CRF based method for PoS tagging for Classical Chinese text in the Ming and Qing dynasties. One of the key issues is the preparation of the training data for CRF. Our initial experiment shows that PoS tagging based on Modern Standard Chinese text can achieve a precision of 83\%; and by adding as little as 12,000-word annotated Classical Chinese texts, we were able to improve the precision to over 90\%.},
  note      = {16th Workshop on Chinese Lexical Semantics, CLSW 2015; conference date: 9--11 May 2015},
}