{"id":212376,"created":"2025-01-19T01:13:20.977774+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00212376","sets":["1164:4961:10511:10658"]},"path":["10658"],"owner":"44499","recid":"212376","title":["デーヴァナーガリー文字OCRの開発"],"pubdate":{"attribute_name":"公開日","attribute_value":"2021-08-21"},"_buckets":{"deposit":"09f966d1-a3bd-46d5-bb76-9a0b25b99318"},"_deposit":{"id":"212376","pid":{"type":"depid","value":"212376","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"デーヴァナーガリー文字OCRの開発","author_link":["541596","541600","541605","541607","541599","541608","541598","541601","541602","541604","541597","541609","541606","541603"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"デーヴァナーガリー文字OCRの開発"},{"subitem_title":"Development of a Devanāgarī Optical Character Recognition (OCR) System","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2021-08-21","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京大学人文社会系研究科"},{"subitem_text_value":"公益財団法人中村元東方研究所"},{"subitem_text_value":"東京大学人文社会系研究科"},{"subitem_text_value":"凸版印刷株式会社情報コミュニケーション事業本部"},{"subitem_text_value":"凸版印刷株式会社情報コミュニケーション事業本部"},{"subitem_text_value":"凸版印刷株式会社総合研究所"},{"subitem_text_value":"凸版印刷株式会社総合研究所"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/212376/files/IPSJ-CH21127001.pdf","label":"IPSJ-CH21127001.pdf"},"date":[{"dateType":"Available","dateValue":"2023-08-21"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-CH21127001.pdf","filesize":[{"value":"905.1 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"24"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"1532043d-3a75-4eb2-9d45-7846a4a5b24c","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2021 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"加藤, 隆宏"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"友成, 有紀"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"谷口, 力光"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"大澤, 留次郎"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"藤巻, 聡"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"岡田, 崇"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"橋本, 江美"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Takahiro, Kato","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yūki, Tomonari","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Chikamitsu, Taniguchi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tomejiro, Osawa","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Satoshi, Fujimaki","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Takashi, Okada","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Emi, Hashimoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN1010060X","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8957","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本発表は,多くのインド諸語表記に用いられる文字であるデーヴァナーガリー文字を読み取るための光学文字認識(OCR)ソフトウェアを開発するために,サンスクリット文献学の専門家とくずし字 AI-OCR 開発などを手がける凸版印刷株式会社との間で行った共同研究に関する報告である.デーヴァナーガリー文字はヒンディー語,マラーティー語,ネパール語などの現代語のみならず,インド圏の文化や歴史などについて多くの史資料を残すサンスクリット語の表記のための主要な文字として使用されてきた.サンスクリット文献学の分野において,サンスクリット語文献のデジタルアーカイブ化・テキストデータベース化は最重要課題であり,これまでドイツ,日本,インドを中心として様々なプロジェクトが展開されてきた.しかしながら,これらのプロジェクトはいずれも手作業(タイピング)によるデータ化が中心であり,個々の研究者の多大な時間と労力と引き換えに築かれてきたものである.今回の研究は,これまで手作業で行われてきたテキストデータ採取の方法を自動化するための OCR を開発し,それによりサンスクリット文献のテキストデータベース化を加速させることを目的とする.重要なサンスクリット文献群を収めるアーナンダ・アーシュラマ・サンスクリット・シリーズ(Anandasrama Sanskrit Series)に収録された文献群を資料として用い,文字システムや文法構造についての専門知識を有する研究者と OCR 技術の開発者が共同して,矩形(データ採取の際に四角形で囲む文字の最小単位)の範囲設定,翻刻・データ化の方法などを検討した.こうして準備された「字形データベース」をもとにした AI-OCR を生成し,その読み取り精度を再検討した.直近の課題としては活版文字に対応した AI-OCR を新たに開発することによって,将来に予想される手書き文字の OCR 開発事業の足掛かりとするとともに,この分野での着実な成果を目指した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper outlines some specific objectives of the research project cooperatively run by Sanskrit language experts and AI-OCR developers and discusses the process of designing “training data” through which an AI-OCR is generated. We also review some data obtained from the AI-OCR and clarify some problems found there.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"4","bibliographic_titles":[{"bibliographic_title":"研究報告人文科学とコンピュータ(CH)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2021-08-21","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"1","bibliographicVolumeNumber":"2021-CH-127"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"updated":"2025-01-19T17:32:02.615511+00:00","links":{}}