% Conference paper in the IALP 2020 proceedings (pp. 75--80).
% Proper nouns in the title are brace-protected so sentence-casing styles keep
% their capitals. No `series` field is given because the proceedings title is
% already carried by `booktitle`; repeating it would print the title twice.
@inproceedings{f6e2817e927549ab9f45b81be150851f,
  author    = {Arwidarasti, {Jessica Naraiswari} and Alfina, Ika and Krisnadhi, {Adila Alfa}},
  title     = {Adjusting {Indonesian} Multiword Expression Annotation to the {Penn Treebank} Format},
  booktitle = {2020 International Conference on Asian Language Processing, {IALP} 2020},
  editor    = {Lu, Yanfeng and Dong, Minghui and Soon, Lay-Ki and Gan, {Keng Hoon}},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2020},
  month     = dec,
  day       = {4},
  pages     = {75--80},
  doi       = {10.1109/IALP51396.2020.9310479},
  language  = {English},
  keywords  = {compound word, Indonesian, multiword expression, Penn Treebank, Stanford parser},
  abstract  = {Multiword Expression (MWE) has been a pain in the neck, especially in determining its word-classes in syntactic treebank. Previous work had proposed annotation guidelines for Indonesian MWEs that align to the Penn Treebank (PTB) format. However, we think that their proposed annotation still needs improvements. Therefore, this study proposes a new annotation guideline in labeling Indonesian MWE that conforms to PTB format. Moreover, we also revised the MWE annotation of an existing Indonesian constituency treebank consisting of 1030 sentences to conform to the new guidelines. To evaluate the revised treebank's quality, we built an Indonesian constituency parser model using the revised treebank and Stanford parser. The experiments show that the resulting parser has an F1-score of 69.97\%.},
  note      = {Publisher Copyright: {\textcopyright} 2020 IEEE. Copyright: Copyright 2021 Elsevier B.V., All rights reserved.; 2020 International Conference on Asian Language Processing, IALP 2020 ; Conference date: 04-12-2020 Through 06-12-2020},
}