% Conference paper (ICMLC 2021): generating malware family samples with Grad-CAM
% to augment training data for deep learning classifiers.
% Author names are stored in "Last, First" form so the family name is parsed correctly.
@inproceedings{3278bda17a3b4f97883cd055d330f980,
title = "Data Augmentation in Training Deep Learning Models for Malware Family Classification",
abstract = "With the rapid development of deep learning technologies, different deep learning models have been applied to detect and classify malware. When applying deep learning models to classify malware families, a major bottleneck is the lack of enough labeled family samples that are required for training deep learning models. The depth model applied to malware needs a huge number of samples for training. In order to solve this issue, we propose a method for generating malware family samples. We use the Grad-CAM algorithm to find the raw data representing malware features. A new sample is created by inserting them into section gaps and new sections in PE files. The experiment results show that adding the generated samples into training dataset can improve the classification accuracy of deep learning models.",
keywords = "Data Augmentation, Deep Learning, Feature Extraction",
author = "Ding, Yuxin and Wang, Guangbin and Ma, Yubin and Ding, Haoxuan",
note = "Publisher Copyright: {\textcopyright} 2021 IEEE.; 20th International Conference on Machine Learning and Cybernetics, ICMLC 2021 ; Conference date: 04-12-2021 Through 05-12-2021",
year = "2021",
doi = "10.1109/ICMLC54886.2021.9737271",
language = "English",
series = "Proceedings - International Conference on Machine Learning and Cybernetics",
publisher = "IEEE Computer Society",
booktitle = "Proceedings of 2021 International Conference on Machine Learning and Cybernetics, ICMLC 2021",
address = "United States",
}