@inproceedings{45e3da1ed8934836a5b75d0c4b1dd786,
title = "Optimizing AI for Mobile Malware Detection by Self-Built-Dataset GAN Oversampling and LGBM",
abstract = "The cyber detection industry focuses on analyzing the behavior of threats in order to develop IOCs and triggers. This process makes the detection always behind the attackers, as there is an analysis time between the attack tool launch and the detection ability. To address the challenges, a dedicated Sandbox environment was built, and thousands of mobile devices' samples were tested, resulted in creation of an up-to-date training dataset that is not based on the attacks analysis. With this dataset, the research focus was directed towards optimizing the AI methodology to achieve the best detection rates for a compromised mobile device. A CupolaGAN was implemented to oversample dataset and to compare results obtained from training LGBM models on both original imbalanced dataset and oversampled dataset. Classification scores on the oversampled data increase by maximum of 0.47+/-0.37%. The performance of the fine-tuned model using Optuna on the balanced data reaches 99.36+/-0.19% accuracy.",
keywords = "CupolaGAN, LightGBM, Sandbox, cybersecurity, malware detection, oversampling",
author = "Ortal Dayan and Lior Wolf and Fang Wang and Yaniv Harel",
note = "Publisher Copyright: {\textcopyright} 2023 IEEE.; 3rd IEEE International Conference on Cyber Security and Resilience, CSR 2023 ; Conference date: 31-07-2023 Through 02-08-2023",
year = "2023",
doi = "10.1109/CSR57506.2023.10224927",
language = "אנגלית",
series = "Proceedings of the 2023 IEEE International Conference on Cyber Security and Resilience, CSR 2023",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "60--65",
booktitle = "Proceedings of the 2023 IEEE International Conference on Cyber Security and Resilience, CSR 2023",
address = "ארצות הברית",
}