% Conference paper (2006) by Vladimir Nikulin, published in the SPIE proceedings series.
% The citation key is the exporter-generated identifier; it is kept unchanged so that
% existing \cite commands continue to resolve.
@inproceedings{196cfc6700f74b3383b0a1dbd4fb8aff,
  author    = {Nikulin, Vladimir},
  title     = {Threshold-based clustering for intrusion detection systems},
  booktitle = {Data Mining, Intrusion Detection, Information Assurance, and Data Networks Security 2006},
  series    = {Proceedings of {SPIE} - The International Society for Optical Engineering},
  year      = {2006},
  doi       = {10.1117/12.665326},
  isbn      = {0819462977},
  language  = {English},
  keywords  = {Distance-based clustering, Intrusion detection, k-nearest-neighbor method},
  abstract  = {Signature-based intrusion detection systems look for known, suspicious patterns in the input data. In this paper we explore compression of labeled empirical data using threshold-based clustering with regularization. The main target of clustering is to compress training dataset to the limited number of signatures, and to minimize the number of comparisons that are necessary to determine the status of the input event as a result. Essentially, the process of clustering includes merging of the clusters which are close enough. As a consequence, we will reduce original dataset to the limited number of labeled centroids. In a complex with k-nearest-neighbor (kNN) method, this set of centroids may be used as a multiclass classifier. Clearly, different attributes have different importance depending on the particular training database. This importance may be regulated in the definition of the distance using linear weight coefficients. The paper introduces special procedure to estimate above weight coefficients. The experiments on the KDD-99 intrusion detection dataset have confirmed effectiveness of the proposed methods.},
  note      = {Data Mining, Intrusion Detection, Information Assurance, and Data Networks Security 2006 ; Conference date: 17-04-2006 Through 18-04-2006},
}