@inproceedings{9e887a894a6144728468966fb1bb8faf,
title = "Neural network-based acoustic vehicle counting",
abstract = "This paper addresses acoustic vehicle counting using one-channel audio. We predict the pass-by instants of vehicles from local minima of clipped vehicle-to-microphone distance. This distance is predicted from audio using a two-stage (coarse-fine) regression, with both stages realised via neural networks (NNs). Experiments show that the NN-based distance regression outperforms by far the previously proposed support vector regression. The 95% confidence interval for the mean of vehicle counting error is within [0.28%, −0.55%]. Besides the minima-based counting, we propose a deep learning counting that operates on the predicted distance without detecting local minima. Although outperformed in accuracy by the former approach, deep counting has a significant advantage in that it does not depend on minima detection parameters. Results also show that removing low frequencies in features improves the counting performance.",
keywords = "Support vector machines, Deep learning, Europe, Artificial neural networks, Signal processing, Acoustics, Vehicle counting, log-mel spectrogram, neural network, peak detection, deep learning",
author = "Slobodan Djukanovi{\'c} and Yash Patel and Jiri Matas and T. Virtanen",
note = "jufoid=55867; European Signal Processing Conference, EUSIPCO 2021 ; Conference date: 23-08-2021 Through 27-08-2021",
year = "2021",
doi = "10.23919/EUSIPCO54536.2021.9615925",
language = "English",
series = "European Signal Processing Conference",
publisher = "IEEE",
pages = "561--565",
booktitle = "2021 29th European Signal Processing Conference (EUSIPCO)",
}