Although deep learning has revolutionized music generation, existing methods
for structured melody generation follow an end-to-end left-to-right
note-by-note generative paradigm and treat each note equally. Here, we present
WuYun, a knowledge-enhanced deep learning architecture for improving the
structure of generated melodies, which first generates the most structurally
important notes to construct a melodic skeleton and subsequently infills it
with dynamically decorative notes into a full-fledged melody. Specifically, we
use music domain knowledge to extract melodic skeletons and employ sequence
learning to reconstruct them, which serve as additional knowledge to provide
auxiliary guidance for the melody generation process. We demonstrate that WuYun
can generate melodies with better long-term structure and musicality and
outperforms other state-of-the-art methods by 0.51 on average on all subjective
evaluation metrics. Our study provides a multidisciplinary lens to design
melodic hierarchical structures and bridge the gap between data-driven and
knowledge-based approaches for numerous music generation tasks.
Description
[2301.04488] WuYun: Exploring hierarchical skeleton-guided melody generation using knowledge-enhanced deep learning
%0 Generic
%1 zhang2023wuyun
%A Zhang, Kejun
%A Wu, Xinda
%A Zhang, Tieyao
%A Huang, Zhijie
%A Tan, Xu
%A Liang, Qihao
%A Wu, Songruoyao
%A Sun, Lingyun
%D 2023
%K architecture knowledge-enhanced
%T WuYun: Exploring hierarchical skeleton-guided melody generation using
knowledge-enhanced deep learning
%U http://arxiv.org/abs/2301.04488
%X Although deep learning has revolutionized music generation, existing methods
for structured melody generation follow an end-to-end left-to-right
note-by-note generative paradigm and treat each note equally. Here, we present
WuYun, a knowledge-enhanced deep learning architecture for improving the
structure of generated melodies, which first generates the most structurally
important notes to construct a melodic skeleton and subsequently infills it
with dynamically decorative notes into a full-fledged melody. Specifically, we
use music domain knowledge to extract melodic skeletons and employ sequence
learning to reconstruct them, which serve as additional knowledge to provide
auxiliary guidance for the melody generation process. We demonstrate that WuYun
can generate melodies with better long-term structure and musicality and
outperforms other state-of-the-art methods by 0.51 on average on all subjective
evaluation metrics. Our study provides a multidisciplinary lens to design
melodic hierarchical structures and bridge the gap between data-driven and
knowledge-based approaches for numerous music generation tasks.
@misc{zhang2023wuyun,
  author        = {Zhang, Kejun and Wu, Xinda and Zhang, Tieyao and Huang, Zhijie and Tan, Xu and Liang, Qihao and Wu, Songruoyao and Sun, Lingyun},
  title         = {{WuYun}: Exploring hierarchical skeleton-guided melody generation using knowledge-enhanced deep learning},
  year          = {2023},
  eprint        = {2301.04488},
  archiveprefix = {arXiv},
  url           = {http://arxiv.org/abs/2301.04488},
  abstract      = {Although deep learning has revolutionized music generation, existing methods
for structured melody generation follow an end-to-end left-to-right
note-by-note generative paradigm and treat each note equally. Here, we present
WuYun, a knowledge-enhanced deep learning architecture for improving the
structure of generated melodies, which first generates the most structurally
important notes to construct a melodic skeleton and subsequently infills it
with dynamically decorative notes into a full-fledged melody. Specifically, we
use music domain knowledge to extract melodic skeletons and employ sequence
learning to reconstruct them, which serve as additional knowledge to provide
auxiliary guidance for the melody generation process. We demonstrate that WuYun
can generate melodies with better long-term structure and musicality and
outperforms other state-of-the-art methods by 0.51 on average on all subjective
evaluation metrics. Our study provides a multidisciplinary lens to design
melodic hierarchical structures and bridge the gap between data-driven and
knowledge-based approaches for numerous music generation tasks.},
  keywords      = {architecture knowledge-enhanced},
  description   = {[2301.04488] WuYun: Exploring hierarchical skeleton-guided melody generation using knowledge-enhanced deep learning},
  added-at      = {2023-04-06T14:31:44.000+0200},
  timestamp     = {2023-04-06T14:31:44.000+0200},
  biburl        = {https://www.bibsonomy.org/bibtex/2cc0aea3242340d0ae377d42e2f9f9114/alex_h},
  interhash     = {38e2ec5c1cfed778c85a02850819c7cd},
  intrahash     = {cc0aea3242340d0ae377d42e2f9f9114},
}