Publications
2023
1.
Al-Nabki, Wesam; Fidalgo, Eduardo; Alegre, Enrique; Alaiz-Rodríguez, Rocío
Author Correction: Short text classification approach to identify child sexual exploitation material Artículo de revista
En: Scientific Reports, vol. 13, no 1, pp. 17840, 2023, (Publisher: Nature Publishing Group UK London).
Resumen | Enlaces | BibTeX | Etiquetas: CSEM detection, law enforcement, machine learning, test classification
@article{al-nabki_author_2023,
title = {Author Correction: Short text classification approach to identify child sexual exploitation material},
author = {Wesam Al-Nabki and Eduardo Fidalgo and Enrique Alegre and Rocío Alaiz-Rodríguez},
url = {https://www.nature.com/articles/s41598-023-45265-2},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
journal = {Scientific Reports},
volume = {13},
number = {1},
pages = {17840},
abstract = {This paper presents a method to identify Child Sexual Exploitation Material (CSEM) files by analyzing file names and paths instead of content, aiding law enforcement in time-sensitive investigations. The approach tackles obfuscation using character n-grams, binary, and orthographic features. Two classification strategies are proposed: one combining separate file name and path classifiers, and another iterating over the path. Six machine learning and deep learning models were tested, with the best achieving an F1 score of 0.988, making it a promising tool for law enforcement agencies.},
note = {Publisher: Nature Publishing Group UK London},
keywords = {CSEM detection, law enforcement, machine learning, test classification},
pubstate = {published},
tppubtype = {article}
}
This paper presents a method to identify Child Sexual Exploitation Material (CSEM) files by analyzing file names and paths instead of content, aiding law enforcement in time-sensitive investigations. The approach tackles obfuscation using character n-grams, binary, and orthographic features. Two classification strategies are proposed: one combining separate file name and path classifiers, and another iterating over the path. Six machine learning and deep learning models were tested, with the best achieving an F1 score of 0.988, making it a promising tool for law enforcement agencies.