@inproceedings{oai:ipsj.ixsq.nii.ac.jp:00214497,
 author = {山本, 貴巳 and Sangwook, Kim and 班, 涛 and 高橋, 健志 and 小澤, 誠一 and Takami, Yamamoto and Sangwook, Kim and Tao, Ban and Takeshi, Takahashi and Seiichi, Ozawa},
 book = {コンピュータセキュリティシンポジウム2021論文集},
 month = {Oct},
 note = {近年，Drive-by Download 攻撃やフィッシングといった Web 媒介型攻撃による被害が深刻になっており，直接サイバー攻撃を仕掛けたり，攻撃につながるウェブサイトに誘導したりする悪性サイトの迅速な発見が求められている．これまで，URL に着目して，文字レベル畳み込みニューラルネットの学習や URL に頻出する単語を許可リスト化，無視リスト化することで，悪性サイトの判定システムを開発してきた．本研究では，この判定システムの拡張として，HTML タグの構造に着目したグラフ畳み込みネットワークによる悪性サイト判定の手法を提案する．HTML 文書は Document Object Model (DOM) によって表現することができ，HTML タグの構造を木構造として表現できる．これを HTML 文書の「グラフ表現」と呼び，グラフ畳み込みネットワークを適用して悪性サイト判定を行う方法を提案する．従来の URL を利用した悪性サイト判定システムに，HTML タグの構造による判定を加えることで，高い精度で悪性サイトの検知が可能であることを示す．, Recently, damage caused by web-based attacks such as drive by-download attacks and phishing has become serious. There is a pressing need to quickly detect malicious websites which directly launch cyberattacks or guide users to dangerous sites to trigger attacks. In previous work, we have developed a malicious-site detection system based on the word frequency of URLs using character-level convolutional neural networks. In this research, as an extension of the existing system, we propose a new approach using graph convolutional networks based on structural features of HTML tags. First, an HTML document is  represented by the document object model (DOM) as a graph to captures structural information in the document. Then, malicious-site detection is performed by applying graph convolutional networks to the graphs. We show that malicious sites can be detected with higher accuracy by incorporating structural information carried by the HTML tags than the previous approach based on URL.},
 pages = {721--726},
 publisher = {情報処理学会},
 title = {HTMLタグの構造に着目したグラフ畳み込みネットワークによる悪性サイト判定},
 year = {2021}
}