Abstract
In deep neural networks with convolutional layers, each layer typically has
fixed-size/single-resolution receptive field (RF). Convolutional layers with
a large RF capture global information from the input features, while layers
with small RF size capture local details with high resolution from the input
features. In this work, we introduce novel deep multi-resolution fully
convolutional neural networks (MR-FCNN), where each layer has different RF
sizes to extract multi-resolution features that capture the global and local
details information from its input features. The proposed MR-FCNN is applied
to separate a target audio source from a mixture of many audio sources.
Experimental results show that using MR-FCNN improves the performance
compared to feedforward deep neural networks (DNNs) and single resolution
deep fully convolutional neural networks (FCNNs) on the audio source
separation problem.
Bibtex
@article{Grais_2017c,
author = {Grais, E.~M. and Wierstorf, H. and Ward, D. and Plumbley, M. D.},
title = {{Multi-Resolution Fully Convolutional Neural Networks for Monaural Audio Source Separation}},
journal = {ArXiv e-prints},
archiveprefix = {arXiv},
eprint = {1710.11473},
year = {2017},
month = oct,
url = {http://adsabs.harvard.edu/abs/2017arXiv171011473G},
adsnote = {Provided by the SAO/NASA Astrophysics Data System},
keywords = {"maruss"}
}