% Conference paper in the ISMIR 2016 proceedings (cleaned-up portal export).
% The month follows the conference dates recorded in the `note` field.
@inproceedings{cebafb480d3d4c7598ab04391ab1f63d,
  author    = {Durand, Simon and Essid, Slim},
  title     = {Downbeat detection with conditional random fields and deep learned features},
  booktitle = {Proceedings of the 17th International Society for Music Information Retrieval Conference, {ISMIR} 2016},
  editor    = {Mandel, Michael I. and Devaney, Johanna and Turnbull, Douglas and Tzanetakis, George},
  publisher = {International Society for Music Information Retrieval},
  pages     = {386--392},
  year      = {2016},
  month     = aug,
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} Simon Durand, Slim Essid.; 17th International Society for Music Information Retrieval Conference, ISMIR 2016 ; Conference date: 07-08-2016 Through 11-08-2016},
  abstract  = {In this paper, we introduce a novel Conditional Random Field (CRF) system that detects the downbeat sequence of musical audio signals. Feature functions are computed from four deep learned representations based on harmony, rhythm, melody and bass content to take advantage of the high-level and multi-faceted aspect of this task. Downbeats being dynamic, the powerful CRF classification system allows us to combine our features with an adapted temporal model in a fully data-driven fashion. Some meters being under-represented in our training set, we show that data augmentation enables a statistically significant improvement of the results by taking into account class imbalance. An evaluation of different configurations of our system on nine datasets shows its efficiency and potential over a heuristic based approach and four downbeat tracking algorithms.},
}