Publications

Carrillo-Mondéjar, Javier; Rodríguez, Ricardo J.

Identifying Runtime Libraries in Statically Linked Linux Binaries Journal Article

In: Future Generation Computer Systems, vol. 164, pp. 107602, 2025, ISSN: 0167-739X.

Abstract | Links | BibTeX | Tags: Binary code analysis, IoT, malware, Runtime library identification, Statically linked binaries

@comment{Journal article. The abstract is stored as plain LaTeX-safe text: percent signs are escaped and no font-switch markup is kept. tppubtype is not a standard BibTeX/biblatex field (presumably written by the exporting tool) and is kept unchanged.}
@article{CarrilloR-FGCS-25,
  title     = {Identifying Runtime Libraries in Statically Linked {Linux} Binaries},
  author    = {Javier Carrillo-Mondéjar and Ricardo J. Rodríguez},
  url       = {http://webdiis.unizar.es/~ricardo/files/papers/CarrilloR-FGCS-25.pdf},
  doi       = {10.1016/j.future.2024.107602},
  issn      = {0167-739X},
  year      = {2025},
  date      = {2025-01-01},
  journal   = {Future Generation Computer Systems},
  volume    = {164},
  pages     = {107602},
  abstract  = {Vulnerabilities in unpatched applications can originate from third-party dependencies in statically linked applications, as they must be relinked each time to take advantage of libraries that have been updated to fix any vulnerability. Despite this, malware binaries are often statically linked to ensure they run on target platforms and to complicate malware analysis. In this sense, identification of libraries in malware analysis becomes crucial to help filter out those library functions and focus on malware function analysis. In this paper, we introduce MANTILLA, a system for identifying runtime libraries in statically linked Linux-based binaries. Our system is based on radare2 to identify functions and extract their features (independent of the underlying architecture of the binary) through static binary analysis and on the K-nearest neighbors supervised machine learning model and a majority rule to predict final values. MANTILLA is evaluated on a dataset consisting of binaries built for different architectures (MIPSeb, ARMel, Intel x86, and Intel x86-64) and different runtime libraries (uClibc, glibc, and musl), achieving very high accuracy. We also evaluate it in two case studies. First, using a dataset of binary files belonging to the binutils collection and second, using an IoT malware dataset. In both cases, good accuracy results are obtained both in terms of runtime library detection (94.4\% and 95.5\%, respectively) and architecture identification (100\% and 98.6\%, respectively).},
  keywords  = {Binary code analysis, IoT, malware, Runtime library identification, Statically linked binaries},
  pubstate  = {published},
  tppubtype = {article}
}

Close

Abascal, León; Rodríguez, Ricardo J.

Poster: Extracting Cryptographic Keys from Windows Live Processes Proceedings Article

In: Egele, Manuel; Moonsamy, Veelasha; Gruss, Daniel; Carminati, Michele (Ed.): Proceedings of the 22nd International Conference on Detection of Intrusions and Malware, and Vulnerability Assessment, pp. 213–219, Springer Nature Switzerland, Cham, 2025, ISBN: 978-3-031-97620-9.

Abstract | Links | BibTeX | Tags: cryptography, digital forensics, malware, Windows

@comment{Conference poster paper. NOTE(review): the word nameTool in the abstract looks like an unexpanded macro standing in for the tool's real name -- confirm and replace. NOTE(review): volume 15748 is presumably a number within a book series, but no series field is present -- confirm and add it. tppubtype is not a standard BibTeX/biblatex field and is kept unchanged.}
@inproceedings{AbascalR-DIMVA-25,
  title     = {Poster: Extracting Cryptographic Keys from {Windows} Live Processes},
  author    = {León Abascal and Ricardo J. Rodríguez},
  editor    = {Manuel Egele and Veelasha Moonsamy and Daniel Gruss and Michele Carminati},
  url       = {https://webdiis.unizar.es/~ricardo/files/papers/AbascalR-DIMVA-25.pdf},
  doi       = {10.1007/978-3-031-97620-9_12},
  isbn      = {978-3-031-97620-9},
  year      = {2025},
  date      = {2025-01-01},
  booktitle = {Proceedings of the 22nd International Conference on Detection of Intrusions and Malware, and Vulnerability Assessment},
  volume    = {15748},
  pages     = {213--219},
  publisher = {Springer Nature Switzerland},
  address   = {Cham},
  abstract  = {Cryptographic keys are a fundamental aspect of modern system security, but when compromised, they become a critical vulnerability, especially in ransomware attacks. Paradoxically, these keys must be available in memory at runtime to function, creating a unique opportunity for defensive tools. We introduce nameTool, an open-source tool designed to locate cryptographic keys in active Windows processes using advanced memory analysis. Unlike traditional approaches that rely on static memory dumps, nameTool performs dynamic analysis in real time, restricting the search to process heap memory to improve efficiency and accuracy. It employs robust key identification heuristics to minimize false positives and is designed for seamless integration with Endpoint Detection and Response systems. nameTool also encourages extensibility: its open-source nature allows researchers and practitioners to enhance its capabilities with custom key detection algorithms. We validated our approach through extensive experiments involving both proof-of-concept ransomware and real-world samples, demonstrating the effectiveness of key extraction and decryption success. Our tool provides a practical path to strengthening ransomware mitigation strategies.},
  keywords  = {cryptography, digital forensics, malware, Windows},
  pubstate  = {published},
  tppubtype = {inproceedings}
}

Close

Pelayo-Benedet, Tomás; Rodríguez, Ricardo J.; Gañán, Carlos H.

RAMPAGE: A Software Framework To Ensure Reproducibility in Algorithmically Generated Domains Detection Journal Article

In: Expert Systems with Applications, vol. 293, pp. 128629, 2025, ISSN: 0957-4174.

Abstract | Links | BibTeX | Tags: algorithmically generated domains detection, evaluation, machine learning models, malware, neural network models

@comment{Journal article. The abstract is stored as plain text with no font-switch markup. The journal name is spelled with a lowercase "with". tppubtype is not a standard BibTeX/biblatex field and is kept unchanged.}
@article{PelayoBenedetRG-ESWA-25,
  title     = {{RAMPAGE}: A Software Framework To Ensure Reproducibility in Algorithmically Generated Domains Detection},
  author    = {Tomás Pelayo-Benedet and Ricardo J. Rodríguez and Carlos H. Gañán},
  url       = {https://webdiis.unizar.es/~ricardo/files/papers/PelayoBenedetRG-ESWA-25.pdf},
  doi       = {10.1016/j.eswa.2025.128629},
  issn      = {0957-4174},
  year      = {2025},
  date      = {2025-12-01},
  urldate   = {2025-12-01},
  journal   = {Expert Systems with Applications},
  volume    = {293},
  pages     = {128629},
  abstract  = {As part of its life cycle, malware can establish communication with its command and control server. To bypass static protection techniques, such as blocking certain IPs in firewalls or DNS server deny lists, malware can use algorithmically generated domains (AGD). Many different solutions based on deep learning have been proposed during the last years to detect this type of domains. However, there is a lack of ability to compare the proposed models because there is no common framework that allows experiments to be replicated under the same conditions. Each previous work shows its evaluation results, but under different experimentation conditions and even with different datasets. In this paper, we address this gap by proposing a software framework, dubbed RAMPAGE (fRAMework to comPAre aGd dEtectors), focused on training and comparing machine learning models for AGD detection. Furthermore, we propose a new model that uses logistic regression and, using RAMPAGE to obtain a fair comparison with different state-of-the-art models, achieves slightly better results than those obtained so far. In addition, the dataset built from real-world samples for evaluation, as well as the source code of RAMPAGE, are also publicly released to facilitate its use and promote experimental reproducibility in this research field.},
  keywords  = {algorithmically generated domains detection, evaluation, machine learning models, malware, neural network models},
  pubstate  = {published},
  tppubtype = {article}
}

Close

Martín-Pérez, Miguel; Rodríguez, Ricardo J

Quantifying Paging on Recoverable Data from Windows User-Space Modules Proceedings Article

In: Proceedings of the 12th EAI International Conference on Digital Forensics & Cyber Crime, Springer, 2021, (Accepted for publication. To appear).

Abstract | Links | BibTeX | Tags: digital forensics, malware, memory forensics, paging, Windows modules

@comment{Conference paper. NOTE(review): pubstate says published while note says accepted and to appear, and no volume or pages are given -- confirm the current status and update both fields together. NOTE(review): the word pluginName in the abstract looks like an unexpanded macro standing in for the plugin's real name -- confirm and replace. tppubtype is not a standard BibTeX/biblatex field and is kept unchanged.}
@inproceedings{MR-ICDF2C-21,
  title     = {Quantifying Paging on Recoverable Data from {Windows} User-Space Modules},
  author    = {Miguel Martín-Pérez and Ricardo J. Rodríguez},
  url       = {https://webdiis.unizar.es/~ricardo/files/papers/MR-ICDF2C-21.pdf},
  year      = {2021},
  date      = {2021-01-01},
  booktitle = {Proceedings of the 12th EAI International Conference on Digital Forensics \& Cyber Crime},
  publisher = {Springer},
  abstract  = {Memory forensic analysis enables a forensic examiner to retrieve evidence of a security incident, such as encryption keys, or analyze malware that resides solely in memory. During this process, the current state of system memory is acquired and saved to a file denoted as memory dump, which is then analyzed with dedicated software for evidence. Although a memory dump contains large amounts of data for analysis, its content can be inaccurate and incomplete due to how an operating system's memory management subsystem works: page swapping, on-demand paging, or page smearing are some of the problems that can affect the data that resides in memory. In this paper, we evaluate how these issues affect user-mode modules by measuring the ratio of modules that reside in memory on a Windows 10 system under different memory workloads. On Windows, a module represents an image (that is, an executable, shared dynamic library, or driver) that was loaded as part of the kernel or a user-mode process. We show that this ratio is particularly low in shared dynamic library modules, as opposed to executable modules. We also discuss the issues of memory forensics that can affect scanning for malicious evidences in particular. Additionally, we have developed a Volatility plugin, dubbed pluginName, which helps forensic analysts obtain paging information from a memory dump for each process running at the time of acquisition, providing them with information on the amount of data that cannot be properly analyzed.},
  note      = {Accepted for publication. To appear},
  keywords  = {digital forensics, malware, memory forensics, paging, Windows modules},
  pubstate  = {published},
  tppubtype = {inproceedings}
}

Close

Selvi, Jose; Rodríguez, Ricardo J; Soria-Olivas, Emilio

Towards Optimal LSTM Neural Networks for Detecting Algorithmically Generated Domain Names Journal Article

In: IEEE Access, vol. 9, pp. 126446–126456, 2021.

Abstract | Links | BibTeX | Tags: deep learning, domain generation algorithms, LSTM, malware

@comment{Journal article. The abstract is stored as LaTeX-safe text: ampersands and percent signs are escaped, and the reported metrics use a period as the decimal separator. tppubtype is not a standard BibTeX/biblatex field and is kept unchanged.}
@article{SRS-ACCESS-21,
  title     = {Towards Optimal {LSTM} Neural Networks for Detecting Algorithmically Generated Domain Names},
  author    = {Jose Selvi and Ricardo J. Rodríguez and Emilio Soria-Olivas},
  url       = {http://webdiis.unizar.es/~ricardo/files/papers/SRS-ACCESS-21.pdf},
  doi       = {10.1109/ACCESS.2021.3111307},
  year      = {2021},
  date      = {2021-01-01},
  urldate   = {2021-01-01},
  journal   = {IEEE Access},
  volume    = {9},
  pages     = {126446--126456},
  abstract  = {Malware detection is a problem that has become particularly challenging over the last decade. A common strategy for detecting malware is to scan network traffic for malicious connections between infected devices and their command and control (C\&C) servers. However, malware developers are aware of this detection method and begin to incorporate new strategies to go unnoticed. In particular, they generate domain names instead of using static Internet Protocol addresses or regular domain names pointing to their C\&C servers. By using a domain generation algorithm, the effectiveness of the blacklisting of domains is reduced, as the large number of domain names that must be blocked greatly increases the size of the blacklist. In this paper, we study different Long Short-Term Memory neural network hyperparameters to find the best network configuration for algorithmically generated domain name detection. In particular, we focus on determining whether the (complex) feature engineering efforts required when using other deep learning techniques, such as Random Forest, can be avoided. In this regard, we have conducted a comparative analysis to study the effect of using different network sizes and configurations on network performance metrics. Our results show an accuracy of 97.62\% and an area under the receiver operating characteristic curve of 0.9956 in the test dataset, indicating that it is possible to obtain good classification results despite avoiding the feature engineering process and additional readjustments required in other machine learning techniques.},
  keywords  = {deep learning, domain generation algorithms, LSTM, malware},
  pubstate  = {published},
  tppubtype = {article}
}

Close

Selvi, Jose; Rodríguez, Ricardo J; Soria-Olivas, Emilio

Detection of Algorithmically Generated Malicious Domain Names using Masked N-Grams Journal Article

In: Expert Systems with Applications, vol. 124, pp. 156–163, 2019, ISSN: 0957-4174.

Abstract | Links | BibTeX | Tags: Domain-generated algorithms, malware, Random Forest

Uroz, Daniel; Rodríguez, Ricardo J

Characteristics and Detectability of Windows Auto-Start Extensibility Points in Memory Forensics Journal Article

In: Digital Investigation, vol. 28, pp. S95–S104, 2019, ISSN: 1742-2876.

Abstract | Links | BibTeX | Tags: Auto-start extensibility points, malware, memory forensics, System persistence, Volatility, Windows registry

@comment{Journal article. The author's middle initial is written with a period. tppubtype is not a standard BibTeX/biblatex field and is kept unchanged.}
@article{UR-DIIN-19,
  title     = {Characteristics and Detectability of {Windows} Auto-Start Extensibility Points in Memory Forensics},
  author    = {Daniel Uroz and Ricardo J. Rodríguez},
  url       = {http://webdiis.unizar.es/~ricardo/files/papers/UR-DIIN-19.pdf},
  doi       = {10.1016/j.diin.2019.01.026},
  issn      = {1742-2876},
  year      = {2019},
  date      = {2019-01-01},
  journal   = {Digital Investigation},
  volume    = {28},
  pages     = {S95--S104},
  abstract  = {Computer forensics is performed during a security incident response process on disk devices or on the memory of the compromised system. The latter case, known as memory forensics, consists in dumping the memory to a file and analyzing it with the appropriate tools. Many security incidents are caused by malware that targets and persists as long as possible in a Windows system within an organization. The persistence is achieved using Auto-Start Extensibility Points (ASEPs), the subset of OS and application extensibility points that allow a program to auto-start without any explicit user invocation. In this paper, we propose a taxonomy of the Windows ASEPs, considering the features that are used or abused by malware to achieve persistence. This taxonomy splits into four categories: system persistence mechanisms, program loader abuse, application abuse, and system behavior abuse. We detail the characteristics of each extensibility point (namely, write permissions, execution privileges, detectability in memory forensics, freshness of system requirements, and execution and configuration scopes). Many of these ASEPs rely on the Windows Registry. We also introduce the tool Winesap, a Volatility plugin that analyzes the registry-based Windows ASEPs in a memory dump. Furthermore, we state the order of execution of some of these registry-based extensibility points and evaluate the effectiveness of our tool in memory dumps taken from a Windows OS where extensibility points were used. Winesap was successful in marking all the registry-based Windows ASEPs as suspicious registry keys.},
  keywords  = {Auto-start extensibility points, malware, memory forensics, System persistence, Volatility, Windows registry},
  pubstate  = {published},
  tppubtype = {article}
}

Close

Rodríguez, Ricardo J

Evolution and Characterization of Point-of-Sale RAM Scraping Malware Journal Article

In: Journal in Computer Virology and Hacking Techniques, vol. 13, no. 3, pp. 179–192, 2017, ISSN: 2263-8733.

Abstract | Links | BibTeX | Tags: Evolution, malware, POS RAM scraping, Software security, Taxonomy