% Technical report entry; citation key kept as exported so existing citations still resolve.
% The export listed each author twice (Japanese, then romanized in "Given, Family" order).
% `author` now holds each person once; the romanized forms, corrected to "Family, Given",
% are kept in the style-ignored `author-en` field.
% The bilingual abstract was moved out of `note` (which styles print) into `abstract` / `abstract-en`.
% NOTE(review): techreport entries require an `institution` field, which this export lacks;
% the OAI key suggests the IPSJ repository -- confirm and add.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00235322,
 author = {嶋田, 創 and 小川, 剛史 and 長谷川, 皓一 and 山口, 由紀子},
 author-en = {Shimada, Hajime and Ogawa, Takeshi and Hasegawa, Hirokazu and Yamaguchi, Yukiko},
 title = {実社会通信データセットにおけるプローブ系アクセスの混入と除外処理の試行},
 number = {6},
 month = jul,
 year = {2024},
 abstract = {世の中には悪性通信検知研究に向けた通信データセットが多数存在している．しかしながら，実ネットワークから採取し匿名化処理だけを行った通信データセットにおいては，ポートスキャンなどの攻撃対象を調査する通信 (プローブ系の通信) が大量に含まれている．この通信データセットをそのまま用いて良性通信/悪性通信検知の識別器を作成した場合，大量にあるプローブ系の通信の特徴にひっぱられて良い識別器が作成できないことが考えられる．そこで本論文では，実ネットワークから採取された通信データセットに対してプローブ系の通信と思われるものを除外するための基準を設定し，設定に沿った除外を行った場合および行わない場合で作成した識別器の評価を行った．また，プローブ系通信としてカテゴライズした通信に対して，どのような意図を持ったプローブかについて推測を試みる．},
 abstract-en = {There are many network communication based traffic dataset for malicious traffic detection researches. However, in a dataset which gathers data from practical networks (with anonymization), it contains probe type communications which is aimed to search victims. If we create classifier which classifies malicious and benign communications including probe type communications, it may create not good classifier because it is largely affected with dominant probe type communications. In this paper, we defined thresholds to exclude probe type communications and evaluated performance of classifiers which are created with including / excluding probe type communications based on thresholds. Furthermore, we estimated intentions of probe type communications which is categorized by thresholds.}
}