{"created":"2025-01-19T01:27:59.664436+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00228860","sets":["934:989:11239:11352"]},"path":["11352"],"owner":"44499","recid":"228860","title":["多段組多サイズ見出しで構成される近代書籍のレイアウト解析"],"pubdate":{"attribute_name":"公開日","attribute_value":"2023-10-31"},"_buckets":{"deposit":"037e2d9d-3c5e-4baf-87e6-e17d27d68a01"},"_deposit":{"id":"228860","pid":{"type":"depid","value":"228860","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"多段組多サイズ見出しで構成される近代書籍のレイアウト解析","author_link":["614365","614368","614363","614361","614360","614364","614367","614366","614369","614362"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"多段組多サイズ見出しで構成される近代書籍のレイアウト解析"},{"subitem_title":"Layout Analysis for Early-modern Japanese Printed Book with Multi-column and Multi-size Headings","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[事例紹介論文] 近代書籍,多段組多サイズ見出しレイアウト,レイアウト解析","subitem_subject_scheme":"Other"}]},"item_type_id":"3","publish_date":"2023-10-31","item_3_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"奈良女子大学"},{"subitem_text_value":"立命館大学"},{"subitem_text_value":"京都女子大学"},{"subitem_text_value":"奈良女子大学"},{"subitem_text_value":"奈良女子大学"}]},"item_3_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Nara Womens University","subitem_text_language":"en"},{"subitem_text_value":"Ritsumeikan University","subitem_text_language":"en"},{"subitem_text_value":"Kyoto Women's University","subitem_text_language":"en"},{"subitem_text_value":"Nara Womens University","subitem_text_language":"en"},{"subitem_text_value":"Nara Womens University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/228860/files/IPSJ-TOM1602008.pdf","label":"IPSJ-TOM1602008.pdf"},"date":[{"dateType":"Available","dateValue":"2025-10-31"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-TOM1602008.pdf","filesize":[{"value":"21.9 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"17"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"f5fcf9cd-118a-4a5d-8617-fc597da905c4","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2023 by the Information Processing Society of Japan"}]},"item_3_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"飯田, 紗也香"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"竹本, 有紀"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"石川, 由羽"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"髙田, 雅美"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"城, 和貴"}],"nameIdentifiers":[{}]}]},"item_3_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Sayaka, Iida","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yuki, Takemoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yu, Ishikawa","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Masami, Takata","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Kazuki, Joe","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA11464803","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_3_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7780","subitem_source_identifier_type":"ISSN"}]},"item_3_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"近代書籍にも対応するOCRとして最近NDLOCRが新規開発された.NDLOCRは多数の一般書籍にみられる1段組みの縦書きレイアウトに対しては十分な精度でレイアウト解析を行うことができる.しかし,新聞のような多段組多サイズ見出しを含むレイアウトの近代書籍には,十分な精度でレイアウト解析を行うことができない.そこで,CRAFTと解像度ピラミッドを用いて多段組多サイズ見出しを含むレイアウトの近代書籍に対する文字切り出しを試みる.多段組多サイズ見出し対応のOCR構築における最終的な目標として明治以降の日本人移民が現地で出版した邦字新聞のテキスト化を目指しているが,本論文では,邦字新聞ほどテキスト化の難易度が高くない多段組多サイズ見出しを含む近代書籍の例として帝国議会会議録に焦点を当てる.帝国議会会議録に対して提案手法と他のOCRにおけるレイアウト解析の精度を比較して検証を行う.","subitem_description_type":"Other"}]},"item_3_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"NDLOCR has recently been newly developed as an OCR for Early-Modern Japanese Printed Books, and it can perform layout analysis with sufficient accuracy for the single-column vertical layouts found in many general books. However, it cannot perform layout analysis with sufficient accuracy for modern books with multi-column layouts and multi-size headings, such as newspapers. Therefore, we attempted to perform text extraction for Early-Modern Japanese Printed Books with layouts that include multi-columns and multi-size headlines using CRAFT and the resolution pyramid. The ultimate goal of OCR construction for multi-column and multi-size headlines is to convert Japanese newspapers published locally by Japanese immigrants after the Meiji period into text. In this paper, we focus on the Imperial Diet Proceedings as an example of an Early-Modern Japanese Printed Book containing multi-column and multi-size headlines, which is not as difficult to convert into text as Japanese newspapers. The proposed method is validated by comparing the accuracy of the proposed method with that of layout analysis by other OCR methods for the Imperial Diet Proceedings.","subitem_description_type":"Other"}]},"item_3_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"79","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌数理モデル化と応用(TOM)"}],"bibliographicPageStart":"67","bibliographicIssueDates":{"bibliographicIssueDate":"2023-10-31","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"2","bibliographicVolumeNumber":"16"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":228860,"updated":"2025-01-19T11:41:32.517508+00:00","links":{}}