% Conference paper in the Computer Security Symposium 2024 proceedings (publisher: IPSJ).
% The citation key is the repository OAI identifier, kept unchanged so existing citations resolve.
% author holds each person once (family name first); the romanized forms live in yomi,
% which pBibTeX/jBibTeX-style Japanese styles are expected to use for sorting and which
% other styles ignore -- NOTE(review): confirm against the bibliography style in use.
% The abstract is stored in abstract rather than note so it is not printed in the reference list.
@inproceedings{oai:ipsj.ixsq.nii.ac.jp:00240964,
  author    = {齋藤, 太新 and 橋本, 正樹 and 須崎, 有康},
  yomi      = {Saito, Taishin and Hashimoto, Masaki and Suzaki, Kuniyasu},
  title     = {{DARPA Dataset} を用いた情報システム内の良性活動抽出手法の検討},
  booktitle = {コンピュータセキュリティシンポジウム2024論文集},
  pages     = {1641--1648},
  publisher = {情報処理学会},
  year      = {2024},
  month     = oct,
  abstract  = {サイバー攻撃の全体像把握や発生源の特定のために，Data Provenance を追跡することで，一連関連イベントの依存関係を紐付け，悪性活動を特定するシステムの活用が進められている．しかし，正規ユーザーによる操作等，通常のシステムの動作が大量に依存関係に含まれることで，生成されるグラフが巨大になり，悪性活動の特定が困難となる依存関係の爆発問題が課題となっている．本稿では，依存関係の爆発の低減のために，ログデータ内の情報を用いた自然言語処理と半教師あり学習によるコンピュータシステム内活動の分類により，頻出の良性活動を抽出する方法を提案する．評価実験では，抽出した良性活動と大規模公開データセットである，DARPA Dataset を用いて，依存関係の爆発問題に対する効果の評価を行い，良性活動を用いて依存関係の爆発を低減可能であることや，コンピュータシステム内の約10\%は良性活動のパターンとして定義出来る可能性があることを示した．加えて，小規模サイズのログデータから抽出した良性活動で大規模データ内の探索空間を削減出来ることを示した． Data Provenance tracing is used to identify malicious activities in cyber attacks by linking related events. However, this approach faces a dependency explosion problem due to the inclusion of numerous benign system operations, making it difficult to isolate malicious activities. This paper proposes a method to extract frequent benign activities using natural language processing and semi-supervised learning of log data, aiming to reduce dependency explosion. We evaluated our method’s effectiveness using the DARPA dataset Transparent Computing Engagement 3. We showed that it is possible to use benign activity to reduce dependency explosion, that approximately 10\% of the time in a computer system may be defined as a pattern of benign activity, and that benign activity extracted from small size log data can reduce the search space of large data.},
}