% CIKM 2020 conference paper introducing the OPHiForest anomaly detection method.
% Braces around OPHiForest, CIKM and ACM keep their capitalisation under
% bibliography styles that convert titles to sentence case.
@inproceedings{04c451f85fcc43c9ac165690b25d23d0,
  author    = {Xiang, Haolong and Salcic, Zoran and Dou, Wanchun and Xu, Xiaolong and Qi, Lianyong and Zhang, Xuyun},
  title     = {{OPHiForest}: Order preserving hashing based isolation forest for robust and scalable anomaly detection},
  booktitle = {{CIKM} 2020 - Proceedings of the 29th {ACM} International Conference on Information and Knowledge Management},
  series    = {International Conference on Information and Knowledge Management, Proceedings},
  publisher = {Association for Computing Machinery},
  year      = {2020},
  pages     = {1655--1664},
  doi       = {10.1145/3340531.3411988},
  isbn      = {9781450368599},
  language  = {English},
  keywords  = {anomaly detection, isolation forest, OPHiForest, order preservation, robust and scalable},
  abstract  = {Anomaly detection is one of the most important data mining tasks in many real-life applications such as network intrusion detection for cybersecurity and medical diagnosis for healthcare. In the big data era, these applications demand fast and versatile anomaly detection capability to handle various types of increasingly huge-volume data. However, existing detection methods are either slow due to high computational complexity, or unable to deal with complicated anomalies like local anomalies. In this paper, we propose a novel anomaly detection method named OPHiForest with the use of the order preserving hashing based isolation forest. The core idea is to learn the information from data to construct better isolation forest structure than the state-of-the-art methods like iForest and LSHiForest, which can achieve robust detection of various anomaly types. We design a fast two-step learning process for the order preserving hashing scheme. This leads to stronger order preservation for better hashing, and therefore enhances anomaly detection robustness and accuracy. Extensive experiments on both synthetic and real-world data sets demonstrate that our method is highly robust and scalable.},
  note      = {29th ACM International Conference on Information and Knowledge Management, CIKM 2020 ; Conference date: 19-10-2020 Through 23-10-2020},
}