{"updated":"2025-01-19T07:38:20.991395+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00241512","sets":["6164:6165:6630:11866"]},"path":["11866"],"owner":"44499","recid":"241512","title":["Beyond OCR: Enhancing Classical Japanese Transcription with Large Language Models"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-11-30"},"_buckets":{"deposit":"12e36211-78c0-4abe-bda9-c4897fefec43"},"_deposit":{"id":"241512","pid":{"type":"depid","value":"241512","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"Beyond OCR: Enhancing Classical Japanese Transcription with Large Language Models","author_link":["665023","665021","665019","665016","665017","665018","665022","665020"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Beyond OCR: Enhancing Classical Japanese Transcription with Large Language Models"},{"subitem_title":"Beyond OCR: Enhancing Classical Japanese Transcription with Large Language Models","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"Large Language Model, Historical Document, Classical Japanese, OCR","subitem_subject_scheme":"Other"}]},"item_type_id":"18","publish_date":"2024-11-30","item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_18_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Sakana AI"},{"subitem_text_value":" ROIS-DS Center for Open Data in the Humanities"},{"subitem_text_value":" National Institute of Informatics"}]},"item_18_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Sakana AI","subitem_text_language":"en"},{"subitem_text_value":" ROIS-DS Center for Open Data in the Humanities","subitem_text_language":"en"},{"subitem_text_value":" National Institute of Informatics","subitem_text_language":"en"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/241512/files/IPSJ-CH2024011.pdf","label":"IPSJ-CH2024011.pdf"},"date":[{"dateType":"Available","dateValue":"2025-12-07"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-CH2024011.pdf","filesize":[{"value":"2.2 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"24"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"7f16a3cb-8625-43b6-bbdc-2b43fb5840c0","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Information Processing Society of Japan"}]},"item_18_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Clanuwat, Tarin"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Zhao Tianyu"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Imajuku, Yuki"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Kitamoto, Asanobu"}],"nameIdentifiers":[{}]}]},"item_18_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Tarin, Clanuwat","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tianyu Zhao","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yuki Imajuku","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Asanobu Kitamoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_5794","resourcetype":"conference paper"}]},"item_18_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"This paper presents a methodology for enhancing Optical Character Recognition (OCR) accuracy for historical Japanese documents, using Large Language Models (LLMs). We experimented with six open-source LLMs, ranging in size from 7 to 14 billion parameters, developing two models—a next-token prediction model and an OCR text refiner—both fine-tuned on classical Japanese text from the Minna de Honkoku project. Our approach significantly reduces the Character Error Rate (CER) by correcting misidentified characters and reordering incorrect sequences, particularly improving the recognition of Katakana and Kanji characters often misinterpreted by RURI Kuzushiji OCR model. The findings demonstrate the potential of advanced LLMs to improve the digitization and preservation of Japanese historical documents.","subitem_description_type":"Other"}]},"item_18_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper presents a methodology for enhancing Optical Character Recognition (OCR) accuracy for historical Japanese documents, using Large Language Models (LLMs). We experimented with six open-source LLMs, ranging in size from 7 to 14 billion parameters, developing two models—a next-token prediction model and an OCR text refiner—both fine-tuned on classical Japanese text from the Minna de Honkoku project. Our approach significantly reduces the Character Error Rate (CER) by correcting misidentified characters and reordering incorrect sequences, particularly improving the recognition of Katakana and Kanji characters often misinterpreted by RURI Kuzushiji OCR model. The findings demonstrate the potential of advanced LLMs to improve the digitization and preservation of Japanese historical documents.","subitem_description_type":"Other"}]},"item_18_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"82","bibliographic_titles":[{"bibliographic_title":"じんもんこん2024論文集"}],"bibliographicPageStart":"75","bibliographicIssueDates":{"bibliographicIssueDate":"2024-11-30","bibliographicIssueDateType":"Issued"},"bibliographicVolumeNumber":"2024"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"created":"2025-01-19T01:46:09.502512+00:00","id":241512,"links":{}}