2021
Santos, F.; Durães, D.; Marcondes, F. S.; Hammerschmidt, N.; Lange, S.; Machado, J.; Novais, P.
In-Car Violence Detection Based on the Audio Signal Proceedings Article
Em: Camacho, D.; Tino, P.; Allmendinger, R. (Ed.): pp. 437-445, Springer Science and Business Media Deutschland GmbH, 2021, ISSN: 0302-9743, (cited By 15; Conference of 22nd International Conference on Intelligent Data Engineering and Automated Learning, IDEAL 2021; Conference Date: 25 November 2021 Through 27 November 2021; Conference Code:269299).
Resumo | Links | BibTeX | Etiquetas: Action recognition; Ambient sounds; Audio action recognition; Audio signal; Audio violence detection; Deep learning; Large-scales; Learning architectures; Signal-processing; Violence detections, Audio acoustics, Classification (of information); Deep learning; Music; Signal detection; Speech processing
@comment{Santos2021437: conference paper in an LNCS volume. The proceedings title is in booktitle, the series name in series, and the bare volume number in volume. pubstate and tppubtype are kept as exported.}
@inproceedings{Santos2021437,
  title      = {In-Car Violence Detection Based on the Audio Signal},
  author     = {Santos, F. and Durães, D. and Marcondes, F. S. and Hammerschmidt, N. and Lange, S. and Machado, J. and Novais, P.},
  editor     = {Camacho, D. and Tino, P. and Allmendinger, R.},
  booktitle  = {Intelligent Data Engineering and Automated Learning -- {IDEAL} 2021},
  series     = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  volume     = {13113},
  pages      = {437--445},
  publisher  = {Springer Science and Business Media Deutschland GmbH},
  year       = {2021},
  date       = {2021-01-01},
  doi        = {10.1007/978-3-030-91608-4_43},
  issn       = {0302-9743},
  url        = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85126037019&doi=10.1007%2f978-3-030-91608-4_43&partnerID=40&md5=23842fca53bfddec1db51dc9346d55a4},
  abstract   = {When it is intended to detect violence in the car, audio, speech processing, music, and ambient sound are some of the main points of this problem since it is necessary to find the similarities and differences between these domains. The recent increase in interest in deep learning has allowed practical applications in many areas of signal processing, often surpassing traditional signal processing on a large scale. This paper presents a comparative study of state-of-the-art deep learning architectures applied for inside car violence detection based only on the audio signal. The methodology proposed for audio signal representation was Mel-spectrogram, after an in-depth review of the literature. We build an In-Car video dataset in the experiments and apply four different deep learning architectures to solve the classification problem. The results have shown that the ResNet-18 model presents the best accuracy results on the test set. © 2021, Springer Nature Switzerland AG.},
  note       = {cited By 15; Conference of 22nd International Conference on Intelligent Data Engineering and Automated Learning, IDEAL 2021 ; Conference Date: 25 November 2021 Through 27 November 2021; Conference Code:269299},
  keywords   = {Action recognition; Ambient sounds; Audio action recognition; Audio signal; Audio violence detection; Deep learning; Large-scales; Learning architectures; Signal-processing; Violence detections, Audio acoustics, Classification (of information); Deep learning; Music; Signal detection; Speech processing},
  pubstate   = {published},
  tppubtype  = {inproceedings}
}