@inproceedings{adda803efb824250bfcb25669b12329a,
title = "Fast, automatic and scalable learning to detect android malware",
abstract = "We propose a novel scheme for Android malware detection. The scheme has two extremely fast phases. First term-frequency simhashing (tf-simhashing) extracts a fixed sized vector for each binary file. The hashing algorithm embeds the frequency of n-grams of bytes into the output vector which can be reshaped into an image representation. In the second phase, we propose a convolutional extreme learning machine (CELM) learns to distinguish between hashes of malicious and clean files as a two class classification task. This scalable scheme is extremely fast in both learning and predicting. The results show that tf-simhashing in an image-shape representation together with CELM provides better performance than three non-parametric models and one state-of-the-art parametric model.",
keywords = "Android malware detection, Convolutional extreme learning machine, Static analysis, Term-frequency simhashing",
author = "Mahmood Yousefi-Azar and Len Hamey and Vijay Varadharajan and McDonnell, {Mark D.}",
year = "2017",
doi = "10.1007/978-3-319-70139-4_86",
language = "English",
isbn = "9783319701387",
series = "Lecture Notes in Computer Science",
publisher = "Springer, Springer Nature",
pages = "848--857",
editor = "Derong Liu and Shengli Xie and Yuanqing Li and Dongbin Zhao and El-Alfy, {El-Sayed M.}",
booktitle = "Neural Information Processing",
address = "United States",
note = "24th International Conference on Neural Information Processing, ICONIP 2017 ; Conference date: 14-11-2017 Through 18-11-2017",
}