% Ptaszynski et al. (2014): survey of large-scale corpora and emotion corpora.
% The citation key is the repository OAI identifier and is kept as-is so that
% existing citations continue to resolve.
% The abstract and the repository copyright notice are stored in the
% `abstract` and `copyright` fields rather than `note`, because standard
% styles print `note` verbatim in the bibliography.
@article{oai:kitami-it.repo.nii.ac.jp:00008178,
  author    = {Ptaszynski, Michal and Rzepka, Rafal and Oyama, Satoshi and Kurihara, Masahito and Araki, Kenji},
  title     = {A Survey on Large Scale Corpora and Emotion Corpora},
  journal   = {Information and Media Technologies},
  volume    = {9},
  number    = {4},
  pages     = {429--445},
  year      = {2014},
  abstract  = {In this paper we present a survey on natural language corpora, with particular focus on corpora of large scale and those applicable to sentiment analysis. Natural language corpora are crucial for training various Natural Language Processing applications, from part-of-speech taggers and dependency parsers to dialog systems or sentiment analysis software. We compare several natural language corpora created for different languages, analyze their distinctive features and the amount of additional annotations provided by the developers of those corpora.},
  copyright = {ここに掲載した著作物の利用に関する注意 本著作物の著作権は日本ソフトウェア科学会に帰属します.本著作物は著作権者である日本ソフトウェア科学会の許可のもとに掲載するものです.ご利用に当たっては「著作権法」に従うことをお願いいたします. Notice for the use of this material: The copyright of this material is retained by the Japan Society for Software Science and Technology (JSSST). This material is published on this web site with the agreement of the JSSST. Please be complied with Copyright Law of Japan if any users wish to reproduce, make derivative work, distribute or make available to the public any part or whole thereof.},
}