Park, Junhyung; Kim, Yonghyun; Bae, Joonhyung; Kim, Kirak; Kwon, Taegyun; Lerch, Alexander; Nam, Juhan. Two Web Toolkits for Multimodal Piano Performance Dataset Acquisition and Fingering Annotation. Proceedings Article. In: Late Breaking Demo (Extended Abstract), Proceedings of the International Society for Music Information Retrieval Conference (ISMIR), Daejeon, South Korea, 2025. Abstract | Links | BibTeX | Tags: Computer Science - Computer Vision and Pattern Recognition, Computer Science - Multimedia, Computer Science - Sound, Electrical Engineering and Systems Science - Audio and Speech Processing, Electrical Engineering and Systems Science - Image and Video Processing — 2025
% Late-breaking demo (extended abstract) listed under the ISMIR 2025 proceedings;
% the preprint is on arXiv as 2509.15222 (same identifier as in the DOI and URL).
% `year` is kept next to `date` so classic BibTeX styles, which do not read
% `date`, still print a year. `tppubtype` is not a standard field; styles that
% do not know it ignore it. It is retained unchanged from the original export.
@inproceedings{park_two_2025,
  title      = {Two Web Toolkits for Multimodal Piano Performance Dataset Acquisition and Fingering Annotation},
  author     = {Park, Junhyung and Kim, Yonghyun and Bae, Joonhyung and Kim, Kirak and Kwon, Taegyun and Lerch, Alexander and Nam, Juhan},
  booktitle  = {Late Breaking Demo (Extended Abstract), Proceedings of the International Society for Music Information Retrieval Conference ({ISMIR})},
  address    = {Daejeon, South Korea},
  year       = {2025},
  date       = {2025-09-01},
  doi        = {10.48550/arXiv.2509.15222},
  eprint     = {2509.15222},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/2509.15222},
  urldate    = {2025-09-20},
  abstract   = {Piano performance is a multimodal activity that intrinsically combines physical actions with the acoustic rendition. Despite growing research interest in analyzing the multimodal nature of piano performance, the laborious process of acquiring large-scale multimodal data remains a significant bottleneck, hindering further progress in this field. To overcome this barrier, we present an integrated web toolkit comprising two graphical user interfaces (GUIs): (i) PiaRec, which supports the synchronized acquisition of audio, video, MIDI, and performance metadata. (ii) ASDF, which enables the efficient annotation of performer fingering from the visual data. Collectively, this system can streamline the acquisition of multimodal piano performance datasets.},
  keywords   = {Computer Science - Computer Vision and Pattern Recognition, Computer Science - Multimedia, Computer Science - Sound, Electrical Engineering and Systems Science - Audio and Speech Processing, Electrical Engineering and Systems Science - Image and Video Processing},
  pubstate   = {published},
  tppubtype  = {inproceedings},
}
publications
Two Web Toolkits for Multimodal Piano Performance Dataset Acquisition and Fingering Annotation. Proceedings Article. In: Late Breaking Demo (Extended Abstract), Proceedings of the International Society for Music Information Retrieval Conference (ISMIR), Daejeon, South Korea, 2025. — 2025