{"id":19243,"created":"2025-01-18T22:51:45.678636+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00019243","sets":["1164:1165:1184:1186"]},"path":["1186"],"owner":"1","recid":"19243","title":["SAX - GTR:高速XMLストリーム読み込み手法"],"pubdate":{"attribute_name":"公開日","attribute_value":"2004-07-13"},"_buckets":{"deposit":"9c2f331e-3491-4538-9fc5-30c58ae058d2"},"_deposit":{"id":"19243","pid":{"type":"depid","value":"19243","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"SAX - GTR:高速XMLストリーム読み込み手法","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"SAX - GTR:高速XMLストリーム読み込み手法"},{"subitem_title":"SAX - GTR : Fast Loading of XML Stream","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2004-07-13","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京都立大学大学院工学研究科"},{"subitem_text_value":"東京都立大学大学院工学研究科"},{"subitem_text_value":"東京都立大学大学院工学研究科"},{"subitem_text_value":"東京都立大学大学院工学研究科"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Engineerong, Tokyo Metropolitan University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Engineerong, Tokyo Metropolitan University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Engineerong, Tokyo Metropolitan University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Engineerong, Tokyo Metropolitan University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/19243/files/IPSJ-DBS04134029.pdf"},"date":[{"dateType":"Available","dateValue":"2006-07-13"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-DBS04134029.pdf","filesize":[{"value":"1.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"13"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"d11764ee-c4dd-4091-96b9-5c8f06539aa9","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2004 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"横山, 昌平"},{"creatorName":"太田, 学"},{"creatorName":"片山, 薫"},{"creatorName":"石川, 博"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Shohei, Yokoyama","creatorNameLang":"en"},{"creatorName":"Manabu, Ohta","creatorNameLang":"en"},{"creatorName":"Kaoru, Katayama","creatorNameLang":"en"},{"creatorName":"Hiroshi, Ishikawa","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10112482","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"アプリケーションからXML文書を扱う仕組みは大きく分けて二つある.一つはDOMに代表されるXML木をメモリ上に展開するタイプの手法であり,もう一つはSAX等,XMLファイルを先頭からデータストリームとして読み込んでゆくタイプの手法である.前者は柔軟な処理を,後者は高速・低消費メモリを特徴としている.本論文では後者の手法に着目し,さらなる高速化に関する手法の提案を行う.具体的には,XML文書をその文書をSAXのイベントから成るストリーム単位に分解し二つのバイナリファイルに分解して保存する.一つのファイルにはイベント列の定義と走査するプログラムによって頻繁に利用される要素属性値が保存され,それ以外のデータはもう一つのファイルに保存する.前者のファイルはXMLファイルを走査するときに読み込まれ,前者はそこに保存された値が利用されるときに読み込まれる.この仕組みによりデータ走査時に読み込むデータの絶対量を削減する事ができ,より高速にXMLストリームを読み込むことができる.本稿ではこのバイナリファイルのフォーマットを説明する.またXMLデータを自動でバイナリ化し,ユーザが提案手法の知識がなくとも,SAXパーサを用いて透過的にアクセス手法を提案する.さらにSAXパーサより高速に動作することを実験により示す.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"There are two basic types of XML parser SAX and DOM. The SAX is a event driven XML parser that parses an XML input stream. The DOM is an in-memory tree representation of the XML document. Unlike SAX, DOM is a read-write API. Documents can be searched, queried, and updated via the DOM interface. This makes DOM much more effective when randomly accessing to XML documents. However, it is quite memory exhaustive compared with SAX because SAX doesn't have to store the entire document in memory. Therefore SAX is scalable from small to very large XML documents. The time taken to parse an XML document grows only linearly with the size of the document. In this paper, we propose an efficient framework for SAX applications called SAX-GTR that divides an XML document in two binary files; one is for the event stream and frequently-accessed data, the other is for non-frequently-accessed data. The division is decided automatically with a particular SAX event handler, without the structural and semantic information such as DTDs. The purpose of this division is to decrease the cost of loading. We also present a transparent access to SAX-GTR documents using SAX event handlers. The effectiveness of SAX-GTR is demonstrated by some experiments.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"220","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告データベースシステム(DBS)"}],"bibliographicPageStart":"213","bibliographicIssueDates":{"bibliographicIssueDate":"2004-07-13","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"71(2004-DBS-134)","bibliographicVolumeNumber":"2004"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"updated":"2025-01-22T22:20:00.487637+00:00","links":{}}