Pati, Kumar Ashis; Gururani, Siddharth; Lerch, Alexander Assessment of Student Music Performances Using Deep Neural Networks Journal Article In: Applied Sciences, vol. 8, no. 4, pp. 507, 2018. Abstract | Links | BibTeX | Tags: deep learning, deep neural networks, DNN, MIR, music education, music informatics, music information retrieval, music learning, music performance assessment Wu, Chih-Wei; Dittmar, Christian; Southall, Carl; Vogl, Richard; Widmer, Gerhard; Hockman, Jason A; Muller, Meinard; Lerch, Alexander A Review of Automatic Drum Transcription Journal Article In: IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 26, no. 9, pp. 1457–1483, 2018, ISSN: 2329-9290. Abstract | Links | BibTeX | Tags: Automatic Music Transcription, deep learning, Instruments, Machine Learning, Matrix Factorization, Rhythm, Spectrogram, Speech processing, Task analysis, Transient analysis2018
@article{pati_assessment_2018,
title = {Assessment of Student Music Performances Using Deep Neural Networks},
author = {Kumar Ashis Pati and Siddharth Gururani and Alexander Lerch},
url = {http://www.mdpi.com/2076-3417/8/4/507/pdf},
doi = {10.3390/app8040507},
year = {2018},
date = {2018-01-01},
urldate = {2018-03-27},
journal = {Applied Sciences},
volume = {8},
number = {4},
pages = {507},
abstract = {Music performance assessment is a highly subjective task often relying on experts to gauge both the technical and aesthetic aspects of the performance from the audio signal. This article explores the task of building computational models for music performance assessment, i.e., analyzing an audio recording of a performance and rating it along several criteria such as musicality, note accuracy, etc. Much of the earlier work in this area has been centered around using hand-crafted features intended to capture relevant aspects of a performance. However, such features are based on our limited understanding of music perception and may not be optimal. In this article, we propose using Deep Neural Networks (DNNs) for the task and compare their performance against a baseline model using standard and hand-crafted features. We show that, using input representations at different levels of abstraction, DNNs can outperform the baseline models across all assessment criteria. In addition, we use model analysis techniques to further explain the model predictions in an attempt to gain useful insights into the assessment process. The results demonstrate the potential of using supervised feature learning techniques to better characterize music performances.},
keywords = {deep learning, deep neural networks, DNN, MIR, music education, music informatics, music information retrieval, music learning, music performance assessment},
pubstate = {published},
tppubtype = {article}
}
@article{wu_review_2018,
title = {A Review of Automatic Drum Transcription},
author = {Chih-Wei Wu and Christian Dittmar and Carl Southall and Richard Vogl and Gerhard Widmer and Jason A Hockman and Meinard Muller and Alexander Lerch},
url = {http://www.musicinformatics.gatech.edu/wp-content_nondefault/uploads/2018/05/Wu-et-al.-2018-A-review-of-automatic-drum-transcription.pdf},
doi = {10.1109/TASLP.2018.2830113},
issn = {2329-9290},
year = {2018},
date = {2018-01-01},
journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
volume = {26},
number = {9},
pages = {1457--1483},
abstract = {In Western popular music, drums and percussion are an important means to emphasize and shape the rhythm, often defining the musical style. If computers were able to analyze the drum part in recorded music, it would enable a variety of rhythm-related music processing tasks. Especially the detection and classification of drum sound events by computational methods is considered to be an important and challenging research problem in the broader field of Music Information Retrieval. Over the last two decades, several authors have attempted to tackle this problem under the umbrella term Automatic Drum Transcription (ADT). This paper presents a comprehensive review of ADT research, including a thorough discussion of the task-specific challenges, categorization of existing techniques, and evaluation of several state-of-the-art systems. To provide more insights on the practice of ADT systems, we focus on two families of ADT techniques, namely methods based on Non-negative Matrix Factorization and Recurrent Neural Networks. We explain the methods' technical details and drum-specific variations and evaluate these approaches on publicly available datasets with a consistent experimental setup. Finally, the open issues and under-explored areas in ADT research are identified and discussed, providing future directions in this field.},
keywords = {Automatic Music Transcription, deep learning, Instruments, Machine Learning, Matrix Factorization, Rhythm, Spectrogram, Speech processing, Task analysis, Transient analysis},
pubstate = {published},
tppubtype = {article}
}
publications
Assessment of Student Music Performances Using Deep Neural Networks Journal Article In: Applied Sciences, vol. 8, no. 4, pp. 507, 2018. A Review of Automatic Drum Transcription Journal Article In: IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 26, no. 9, pp. 1457–1483, 2018, ISSN: 2329-9290.2018