% Conference paper in the IALP 2014 proceedings (IEEE), pp. 70--73.
% NOTE(review): the address field holds a country rather than a publisher city; confirm the city before relying on it.
@inproceedings{48a235bdc1484997b8694f2b2a8ea324,
  author    = {Rashel, Fam and Luthfi, Andry and Dinakaramani, Arawinda and Manurung, Ruli},
  title     = {Building an {Indonesian} rule-based part-of-speech tagger},
  booktitle = {Proceedings of the International Conference on Asian Language Processing 2014, {IALP} 2014},
  editor    = {Dong, Minghui and Lu, Yanfeng and Banchs, Rafael E. and Ranaivo-Malancon, Bali},
  pages     = {70--73},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2014},
  month     = dec,
  day       = {3},
  doi       = {10.1109/IALP.2014.6973521},
  language  = {English},
  keywords  = {disambiguation rule, part of speech tag, token},
  abstract  = {This paper describes work on a part-of-speech tagger for the Indonesian language by employing a rule-based approach. The system tokenizes documents while also considering multi-word expressions and recognizes named entities. It then applies tags to every token, starting from closed-class words to open-class words and disambiguates the tags based on a set of manually defined rules. The system currently obtains an accuracy of 79% on a manually tagged corpus of roughly 250.000 tokens.},
  note      = {Publisher Copyright: {\textcopyright} 2014 IEEE.; International Conference on Asian Language Processing 2014, IALP 2014 ; Conference date: 20-10-2014 Through 22-10-2014},
}