% Journal article: Kim and Lee (2025), Journal of The Korea Society of
% Computer and Information, vol. 30, no. 11.
@article{ART003266107,
  author  = {Kim, Gwang-Ho and Lee, Soo-Jin},
  title   = {Transformer-based {Android} Malware Classification using Multi-stage Feature Selection},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2025},
  volume  = {30},
  number  = {11},
  pages   = {179--189},
}
TY  - JOUR
AU  - Gwang-Ho Kim
AU  - Soo-Jin Lee
TI  - Transformer-based Android Malware Classification using Multi-stage Feature Selection
JO  - Journal of The Korea Society of Computer and Information
PY  - 2025
VL  - 30
IS  - 11
PB  - The Korean Society Of Computer And Information
SP  - 179
EP  - 189
SN  - 1598-849X
AB  - High-dimensional features in API Call-based Android malware detection lead to high computational costs when applying Transformer models. To address this, this paper proposes a multi-stage feature selection pipeline combining LightGBM and Transformer's tokenization method to achieve both model lightweightness and high performance. The proposed method ranks feature importance using LightGBM and then dynamically constructs a final feature set constrained by each Transformer's maximum input token limit. Experimental results show that despite dramatically reducing 9,503 original features to 80-95, our model achieved up to 98.28% accuracy in binary classification and an 83.66% Macro F1-Score in multi-class classification. This demonstrates that our methodology provides comparable performance to previous studies with significantly fewer features, proving it to be an effective solution for ensuring both efficiency and high detection rates in high-dimensional data analysis.
KW  - Android Malware;API-Call;Feature Selection;LightGBM;Transformer
DO  -
UR  -
ER  -
Gwang-Ho Kim and Soo-Jin Lee. (2025). Transformer-based Android Malware Classification using Multi-stage Feature Selection. Journal of The Korea Society of Computer and Information, 30(11), 179-189.
Gwang-Ho Kim and Soo-Jin Lee. 2025, "Transformer-based Android Malware Classification using Multi-stage Feature Selection", Journal of The Korea Society of Computer and Information, vol.30, no.11, pp.179-189.
Gwang-Ho Kim, Soo-Jin Lee "Transformer-based Android Malware Classification using Multi-stage Feature Selection" Journal of The Korea Society of Computer and Information 30.11 (2025) : 179-189.
Gwang-Ho Kim, Soo-Jin Lee. Transformer-based Android Malware Classification using Multi-stage Feature Selection. Journal of The Korea Society of Computer and Information. 2025; 30(11), 179-189.
Gwang-Ho Kim and Soo-Jin Lee. "Transformer-based Android Malware Classification using Multi-stage Feature Selection" Journal of The Korea Society of Computer and Information 30, no.11 (2025) : 179-189.
Gwang-Ho Kim; Soo-Jin Lee. Transformer-based Android Malware Classification using Multi-stage Feature Selection. Journal of The Korea Society of Computer and Information, 30(11), 179-189.
Gwang-Ho Kim; Soo-Jin Lee. Transformer-based Android Malware Classification using Multi-stage Feature Selection. Journal of The Korea Society of Computer and Information. 2025; 30(11) 179-189.
Gwang-Ho Kim, Soo-Jin Lee. Transformer-based Android Malware Classification using Multi-stage Feature Selection. Journal of The Korea Society of Computer and Information. 2025; 30(11), 179-189.
Gwang-Ho Kim and Soo-Jin Lee. "Transformer-based Android Malware Classification using Multi-stage Feature Selection" Journal of The Korea Society of Computer and Information 30, no.11 (2025) : 179-189.