Inter-clause syntactic and semantic structures are important for semantic reasoning. This paper presents clause boundary and clause class annotation on the `Balanced Corpus of Contemporary Written Japanese'. The annotation is based on the Tori-Bank label set, which provides the most fine-grained clause classes. We reformulated the legacy syntactic pattern into a syntactic-dependency-based pattern. Two annotators modified the automatically extracted clause boundary candidates. In this study, we investigate the patterns of disagreement in the annotation.
% LREC 2018 conference paper (three authors).
% Authors are separated with " and " and written as "Last, First" so BibTeX
% parses each person unambiguously.
% NOTE(review): `date` is kept as exported; it presumably holds the conference
% days (7-12 May) and is not an ISO 8601 date, so biblatex/Biber may warn about
% it -- confirm the target toolchain before converting it.
% NOTE(review): `location` appears to be the conference venue and `address`
% the publisher's city; under biblatex these two names alias each other --
% verify which one the bibliography style should print.
@inproceedings{MATSUMOTO18.4,
  author    = {Matsumoto, Satomi and Asahara, Masayuki and Arita, Setsuko},
  title     = {Japanese clause classification annotation on the `{Balanced Corpus of Contemporary Written Japanese}'},
  booktitle = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation ({LREC} 2018)},
  year      = {2018},
  month     = may,
  date      = {7-12},
  location  = {Miyazaki, Japan},
  editor    = {Kiyoaki Shirai},
  publisher = {European Language Resources Association (ELRA)},
  address   = {Paris, France},
  isbn      = {979-10-95546-24-5},
  language  = {english}
}