% Workshop paper describing the DCASE 2017 Challenge setup (tasks, datasets,
% baseline system), published in the DCASE2017 workshop proceedings.
% The citation key is an auto-generated identifier and is kept unchanged so
% that existing citations of this entry continue to resolve.
% NOTE(review): the original export grouped "Benjamin Martinez" as the given
% names of the fourth author, with "Elizalde" as the family name; that split
% is preserved here. Confirm whether "Martinez" belongs to the family name.
@inproceedings{32ee7d149a974ac6a641e79bc5106c1f,
  author    = {Mesaros, Annamaria and Heittola, Toni and Diment, Aleksandr and Elizalde, Benjamin Martinez and Shah, Ankit and Vincent, Emmanuel and Raj, Bhiksha and Virtanen, Tuomas},
  title     = {{DCASE} 2017 challenge setup: tasks, datasets and baseline system},
  booktitle = {Proceedings of the Detection and Classification of Acoustic Scenes and Events 2017 Workshop ({DCASE2017})},
  pages     = {85--92},
  publisher = {Tampere University of Technology. Laboratory of Signal Processing},
  year      = {2017},
  keywords  = {Sound scene analysis; Acoustic scene classification; Sound event detection; Audio tagging; Rare sound events},
  abstract  = {DCASE 2017 Challenge consists of four tasks: acoustic scene classification, detection of rare sound events, sound event detection in real-life audio, and large-scale weakly supervised sound event detection for smart cars. This paper presents the setup of these tasks: task definition, dataset, experimental setup, and baseline system results on the development dataset. The baseline systems for all tasks rely on the same implementation using multilayer perceptron and log mel-energies, but differ in the structure of the output layer and the decision making process, as well as the evaluation of system output using task specific metrics.},
}