{"links":{},"id":240997,"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00240997","sets":["6164:6165:6462:11854"]},"path":["11854"],"owner":"11","recid":"240997","title":["ログ収集のための機械学習を用いたJSON形式ログファイル判別の検討"],"pubdate":{"attribute_name":"PubDate","attribute_value":"2024-10-15"},"_buckets":{"deposit":"260435e6-500f-4e6b-b73c-0128572af147"},"_deposit":{"id":"240997","pid":{"type":"depid","value":"240997","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"ログ収集のための機械学習を用いたJSON形式ログファイル判別の検討","author_link":["662714","662715","662716","662717","662718","662719","662720","662721","662722","662723","662724","662725","662726","662727"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"ログ収集のための機械学習を用いたJSON形式ログファイル判別の検討","subitem_title_language":"ja"},{"subitem_title":"A Consideration of JSON format Log File Discrimination using Machine Learning for Automatic Log Collection","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"機械学習,デジタルフォレンジック,ログ解析","subitem_subject_scheme":"Other"}]},"item_type_id":"18","publish_date":"2024-10-15","item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_18_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京情報大学大学院総合情報学研究科"},{"subitem_text_value":"日立システムズサイバーセキュリティリサーチセンタ"},{"subitem_text_value":"日立システムズサイバーセキュリティリサーチセンタ"},{"subitem_text_value":"日立システムズ セキュリティ・コアバリュー本部"},{"subitem_text_value":"東京情報大学総合情報学部"},{"subitem_text_value":"東京情報大学総合情報学部"},{"subitem_text_value":"東京情報大学総合情報学部"}]},"item_18_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Infomatics, Tokyo Universiy of Infomation Sciences","subitem_text_language":"en"},{"subitem_text_value":"Hitachi Systems, Ltd. Cyber Security Research Center","subitem_text_language":"en"},{"subitem_text_value":"Hitachi Systems, Ltd. Cyber Security Research Center","subitem_text_language":"en"},{"subitem_text_value":"Hitachi Systems, Ltd. Security Core Value Office","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Informatics, Tokyo University of Information Sciences","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Informatics, Tokyo University of Information Sciences","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Informatics, Tokyo University of Information Sciences","subitem_text_language":"en"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/240997/files/IPSJ-CSS2024251.pdf","label":"IPSJ-CSS2024251.pdf"},"date":[{"dateType":"Available","dateValue":"2026-10-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-CSS2024251.pdf","filesize":[{"value":"644.2 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"30"},{"tax":["include_tax"],"price":"0","billingrole":"46"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"c63b398e-5647-42fe-936d-de2df8dc62ae","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Information Processing Society of Japan"}]},"item_18_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"谷屋, 直樹"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"中野, 心太"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"関谷, 信吾"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"折田, 彰"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"岸本, 頼紀"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"早稲田, 篤志"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"花田, 真樹"}],"nameIdentifiers":[{}]}]},"item_18_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Naoki, Taniya","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Shinta, Nakano","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Shingo, Sekiya","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Akira, Orita","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yorinori, Kishimoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Atsushi, Waseda","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Masaki, Hanada","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_5794","resourcetype":"conference paper"}]},"item_18_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"デジタルフォレンジックにおいて,ログファイルを収集する作業は煩わしい.これに対してファイルのバイナリデータに対してfasttextを利用した類似度からテキスト形式のログファイルを自動判別,収集する方法が提案されている.しかし,この手法ではnginxやApacheなどのログ出力形式として利用されるJSON形式のログファイルに対応できない.JSON形式ファイルでは,出力するアプリケーション毎にキーが異なるため,tf-idfのような類似度では分類が難しい.そこで,fasttext,ナイーブベイズ,ランダムフォレスト,SVMのそれぞれのアルゴリズムを用いて類似度を計算し,その傾向について分析する.これにより,ログファイルか否かの判別に適したアルゴリズムについて検討・報告する.","subitem_description_type":"Other"}]},"item_18_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"In digital forensics, collecting log files is a difficult task. A method has been proposed to automatically identify and collect text-format log files based on similarity using fasttext for the binary data of the files. However, this method does not support JSON log files, which are used as the log output format for nginx, Apache, etc. In JSON files, the keys are different for each output application, making classification difficult using similarity measures such as tf-idf. Therefore, we investigated similarity measures using each of the algorithms, fasttext, naive Bayes, random forest, and SVM, and investigated and reported on algorithms suitable for identifying log files.","subitem_description_type":"Other"}]},"item_18_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"1883","bibliographic_titles":[{"bibliographic_title":"コンピュータセキュリティシンポジウム2024論文集"}],"bibliographicPageStart":"1880","bibliographicIssueDates":{"bibliographicIssueDate":"2024-10-15","bibliographicIssueDateType":"Issued"}}]},"relation_version_is_last":true,"weko_creator_id":"11"},"created":"2025-01-19T01:45:30.516049+00:00","updated":"2025-03-06T06:12:15.550202+00:00"}