@inproceedings{e30fb86dd4fd458e87a8bec0d5664b57,
title = "Scale and shift invariant time/frequency representation using auditory statistics: Application to rhythm description",
abstract = "In this paper we propose two novel scale and shift-invariant time-frequency representations of the audio content. Scale-invariance is a desired property to describe the rhythm of an audio signal as it will allow to obtain the same representations for same rhythms played at different tempi. This property can be achieved by expressing the time-axis in log-scale, for example using the Scale Transform (ST). Since the frequency locations of the audio content are also important, we previously extended the ST to the Modulation Scale Spectrum (MSS). However, this MSS does not allow to represent the inter-relationship between the audio content existing in various frequency bands. To solve this issue, we propose here two novel representations. The first one is based on the 2D Scale Transform, the second on statistics (inspired by the auditory experiments of McDermott) that represent the interrelationship between the various frequency bands. We apply both representations to a task of rhythm class recognition and demonstrates their benefits. We show that the introduction of auditory statistics allows a large increase of the recognition results.",
keywords = "2D-Fourier, 2D-Scale, Fourier-Mellin Transform, auditory statistics, rhythm description",
author = "Ugo Marchand and Geoffroy Peeters",
note = "Publisher Copyright: {\textcopyright} 2016 IEEE.; 26th IEEE International Workshop on Machine Learning for Signal Processing, MLSP 2016 - Proceedings ; Conference date: 13-09-2016 Through 16-09-2016",
year = "2016",
month = nov,
day = "8",
doi = "10.1109/MLSP.2016.7738904",
language = "English",
series = "IEEE International Workshop on Machine Learning for Signal Processing, MLSP",
publisher = "IEEE Computer Society",
editor = "Kostas Diamantaras and Aurelio Uncini and Palmieri, \{Francesco A. N.\} and Jan Larsen",
booktitle = "2016 IEEE International Workshop on Machine Learning for Signal Processing, MLSP 2016 - Proceedings",
}