{"updated":"2025-01-20T19:21:16.938384+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00141521","sets":["1164:3500:7866:8222"]},"path":["8222"],"owner":"11","recid":"141521","title":["画像分解による『殷墟卜辭綜類』掲出字頻度分析"],"pubdate":{"attribute_name":"公開日","attribute_value":"2015-03-23"},"_buckets":{"deposit":"76e4e3d7-cb3e-4f06-b4cf-20209b1daa8a"},"_deposit":{"id":"141521","pid":{"type":"depid","value":"141521","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"画像分解による『殷墟卜辭綜類』掲出字頻度分析","author_link":["206741","206738","206743","206742","206739","206740"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"画像分解による『殷墟卜辭綜類』掲出字頻度分析"},{"subitem_title":"Glyph Appearance Frequency Estimation of \"Inkyo Bokuji Sourui\" by Image Decomposition","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"言語処理技術","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2015-03-23","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"広島大学総合科学研究科"},{"subitem_text_value":"茨城大学人文学科"},{"subitem_text_value":"茨城大学人文学科"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Hiroshima University, Faculty of Integrated Arts and Science","subitem_text_language":"en"},{"subitem_text_value":"Ibaraki University, College of Hummanities","subitem_text_language":"en"},{"subitem_text_value":"Ibaraki University, College of Hummanities","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/141521/files/IPSJ-IFAT15118005.pdf"},"date":[{"dateType":"Available","dateValue":"2017-03-23"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-IFAT15118005.pdf","filesize":[{"value":"2.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"39"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"c983b03f-fd5b-4d57-9f09-b91f47a27b95","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2015 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"鈴木, 俊哉"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"鈴木, 敦"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"菅谷, 克行"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Toshiya, Suzuki","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Atsushi, Suzuki","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Katsuyuki, Sugaya","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10114171","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"甲骨文字のデジタル化において,文字符号化して問題ないか,あるいは画像として扱うべきかは,拓本資料の鮮明さや掲出例数を考慮して判断しなければならない.我々は印刷物として公表されたデータベースである 『殷墟卜辭綜類』 と 『殷墟甲骨刻辭類纂』 に基づいた検討をすすめているが,全て手書き資料であり,また,そこに模写された文字の集合も明確ではないため,文字認識的な手法をとることができない.本研究では,掲出例数を概算するため,両書に共通するレイアウト構造をもとに模写テキストを画像分解する方法を検討した.両書の画像分解精度が大きく異なる結果が得られたが,この原因は両書の編集・出版方針の違いによると推測される.また,本研究の手法の適用範囲についても報告する.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"In the digitization of the Oracle Bone materials, the criteria to digitize as “coded text” or as an image should be decided with the consideration about the legibility of the source materials and the “glyphs” on the materials are sufficiently popular to interchange with the stable identity. For the character encoding in ISO/IEC 10646, once Japanese experts proposed to select the representative glyphs by the frequency of the contexts listed in the corpuses, like “殷墟卜辭類纂” or “殷墟甲骨刻辭類纂”. In this report, we estimated the frequency by automatic image decomposition method. The representative glyphs with the frequencies with the examples more than 10 are estimated about 850. This is further smaller than the estimation by the cross section of 2 corpuses.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告情報基礎とアクセス技術(IFAT)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2015-03-23","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"5","bibliographicVolumeNumber":"2015-IFAT-118"}]},"relation_version_is_last":true,"weko_creator_id":"11"},"created":"2025-01-19T00:19:05.803348+00:00","id":141521,"links":{}}