@comment{
  Technical report (2011) on automatically adding voiced consonant marks
  (dakuten) to Meiji-era Japanese literary text.
  - author holds the four authors in Japanese script; author_en is an ignored
    helper field holding the same four names romanized (Last, First).
  - abstract holds the Japanese abstract followed by the English abstract.
  - TODO(review): the institution field, required for techreport entries, is
    missing; the repository key suggests IPSJ, but confirm before adding it.
}
@techreport{oai:ipsj.ixsq.nii.ac.jp:00074033,
  author    = {岡, 照晃 and 小町, 守 and 小木曽, 智信 and 松本, 裕治},
  author_en = {Oka, Teruaki and Komachi, Mamoru and Ogiso, Toshinobu and Matsumoto, Yuji},
  title     = {機械学習による近代文語文への濁点の自動付与},
  number    = {6},
  month     = may,
  year      = {2011},
  abstract  = {現代日本語のように，濁音を仮名で表記する際に必ず濁点を用いる習慣が定着したのは明治時代以降のことで，明治期の文献の中では濁音が期待される文字に濁点のない濁点無表記の場合が多い．本論文では，濁点無表記の濁音仮名文字を識別し，自動で濁点を補う手法について述べる．我々は，判定点の文字が濁点無表記文字か否かを決定する2値分類問題として定式化を行った．提案手法では，周辺文字列の情報のみを用いて点推定を行う．オンライン学習を採用し，大規模な『太陽コーパス』から学習を行なった．これにより提案手法は，『国民之友』において96.016\%の精度と98.283\%の再現率を達成した．, The present-day Japanese use of voiced consonant mark had established in Meiji Era. Thus, modern Japanese literary text written in Meiji Era often lacks compulsory voiced consonant marks. In this paper, we propose an approach to automatic labeling of voiced consonants for modern Japanese literary language. We formulate the task of labeling voiced consonants into binary classification problem. Our method uses as its feature set only surface information about the surrounding character strings with pointwise prediction. We use an online learning method for exploiting large datasets from Taiyo Corpus. We achieve 96.016\% precision and 98.283\% recall on the Kokumin\_no\_tomo Corpus.},
}