Publications

Weninger, F., Le Roux, J., Hershey, J.R., Watanabe, S., "Discriminative NMF and its application to single-channel source separation", Interspeech, September 2014, vol. 15, pp. 865-869.
BibTeX TR2014-081 PDF
- @inproceedings{Weninger2014sep,
- author = {Weninger, F. and {Le Roux}, J. and Hershey, J. R. and Watanabe, S.},
- title = {Discriminative {NMF} and its application to single-channel source separation},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {865--869},
- month = sep,
- publisher = {International Speech Communication Association},
- issn = {2308-457X},
- url = {https://www.merl.com/publications/TR2014-081}
- }
Le Roux, J., Vincent, E., "A Categorization of Robust Speech Processing Datasets", Tech. Rep. TR2014-116, Mitsubishi Electric Research Laboratories, September 2014.
BibTeX TR2014-116 PDF
- @techreport{LeRouxVincent2014TRdatasets,
- author = {{Le Roux}, J. and Vincent, E.},
- title = {A Categorization of Robust Speech Processing Datasets},
- institution = {Mitsubishi Electric Research Laboratories},
- year = 2014,
- number = {TR2014-116},
- address = {Cambridge MA, USA},
- month = sep,
- note = {v2014-09},
- url = {https://www.merl.com/publications/TR2014-116}
- }
Hershey, J.R., Le Roux, J., Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures", arXiv, August 2014.
BibTeX arXiv
- @article{Hershey2014aug,
- author = {Hershey, J. R. and {Le Roux}, J. and Weninger, F.},
- title = {Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures},
- journal = {arXiv},
- year = 2014,
- month = aug,
- eprint = {1409.2574},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/1409.2574}
- }
Tachioka, Y., Narita, T., Watanabe, S., Le Roux, J., "Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments", Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA), DOI: 10.1109/HSCMA.2014.6843272, May 2014, pp. 162-166.
BibTeX TR2014-034 PDF
- @inproceedings{Tachioka2014may2,
- author = {Tachioka, Y. and Narita, T. and Watanabe, S. and {Le Roux}, J.},
- title = {Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments},
- booktitle = {Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA)},
- year = 2014,
- pages = {162--166},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/HSCMA.2014.6843272},
- url = {https://www.merl.com/publications/TR2014-034}
- }
Tachioka, Y., Narita, T., Weninger, F., Watanabe, S., "Dual system combination approach for various reverberant environments with dereverberation techniques", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-032 PDF
- @inproceedings{Tachioka2014may,
- author = {Tachioka, Y. and Narita, T. and Weninger, F. and Watanabe, S.},
- title = {Dual system combination approach for various reverberant environments with dereverberation techniques},
- booktitle = {IEEE REVERB Workshop},
- year = 2014,
- month = may,
- url = {https://www.merl.com/publications/TR2014-032}
- }
Weninger, F., Watanabe, S., Le Roux, J., Hershey, J.R., Tachioka, Y., Geiger, J., Schuller, B., Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-033 PDF
- @inproceedings{Weninger2014may2,
- author = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
- title = {The {MERL/MELCO/TUM} System for the {REVERB} Challenge Using Deep Recurrent Neural Network Feature Enhancement},
- booktitle = {IEEE REVERB Workshop},
- year = 2014,
- month = may,
- url = {https://www.merl.com/publications/TR2014-033}
- }
Naini, R., Rane, S., Ramalingam, S., "A Vanishing Point-based Global Descriptor for Manhattan Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854423, May 2014, pp. 4349-4353.
BibTeX TR2014-029 PDF
- @inproceedings{Naini2014may,
- author = {Naini, R. and Rane, S. and Ramalingam, S.},
- title = {A Vanishing Point-based Global Descriptor for {Manhattan} Scenes},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {4349--4353},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854423},
- url = {https://www.merl.com/publications/TR2014-029}
- }
Simsekli, U., Le Roux, J., Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
BibTeX TR2014-027 PDF Software
- @inproceedings{Simsekli2014may,
- author = {Simsekli, U. and {Le Roux}, J. and Hershey, J. R.},
- title = {Non-negative Source-filter Dynamical System for Speech Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {6206--6210},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854797},
- url = {https://www.merl.com/publications/TR2014-027}
- }
Tang, H., Watanabe, S., Marks, T.K., Hershey, J.R., "Log-linear Dialog Manager", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854371, May 2014, pp. 4092-4096.
BibTeX TR2014-024 PDF
- @inproceedings{Tang2014may,
- author = {Tang, H. and Watanabe, S. and Marks, T. K. and Hershey, J. R.},
- title = {Log-linear Dialog Manager},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {4092--4096},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854371},
- url = {https://www.merl.com/publications/TR2014-024}
- }
Wang, Y., Ortega, A., Tian, D., Vetro, A., "A Graph-based Joint Bilateral Approach for Depth Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6853724, May 2014, pp. 885-889.
BibTeX TR2014-028 PDF
- @inproceedings{Wang2014may,
- author = {Wang, Y. and Ortega, A. and Tian, D. and Vetro, A.},
- title = {A Graph-based Joint Bilateral Approach for Depth Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {885--889},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6853724},
- url = {https://www.merl.com/publications/TR2014-028}
- }
Watanabe, S., Le Roux, J., "Black Box Optimization for Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854202, May 2014, pp. 3256-3260.
BibTeX TR2014-021 PDF
- @inproceedings{Watanabe2014may,
- author = {Watanabe, S. and {Le Roux}, J.},
- title = {Black Box Optimization for Automatic Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {3256--3260},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854202},
- url = {https://www.merl.com/publications/TR2014-021}
- }
Weng, C., Yu, D., Watanabe, S., Juang, B.-H.F., "Recurrent Deep Neural Networks for Robust Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854661, May 2014, pp. 5532-5536.
BibTeX TR2014-023 PDF
- @inproceedings{Weng2014may,
- author = {Weng, C. and Yu, D. and Watanabe, S. and Juang, B.-H. F.},
- title = {Recurrent Deep Neural Networks for Robust Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {5532--5536},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854661},
- url = {https://www.merl.com/publications/TR2014-023}
- }
Weninger, F., Watanabe, S., Tachioka, Y., Schuller, B., "Deep Recurrent De-noising Auto-encoder and Blind De-reverberation for Reverberated Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854478, May 2014, pp. 4623-4627.
BibTeX TR2014-022 PDF
- @inproceedings{Weninger2014may1,
- author = {Weninger, F. and Watanabe, S. and Tachioka, Y. and Schuller, B.},
- title = {Deep Recurrent De-noising Auto-encoder and Blind De-reverberation for Reverberated Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {4623--4627},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854478},
- url = {https://www.merl.com/publications/TR2014-022}
- }
Zhang, J., Chen, L., Boufounos, P.T., Gu, Y., "On the Theoretical Analysis of Cross Validation in Compressive Sensing", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854225, May 2014, pp. 3370-3374.
BibTeX TR2014-025 PDF
- @inproceedings{Zhang2014may,
- author = {Zhang, J. and Chen, L. and Boufounos, P. T. and Gu, Y.},
- title = {On the Theoretical Analysis of Cross Validation in Compressive Sensing},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {3370--3374},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854225},
- url = {https://www.merl.com/publications/TR2014-025}
- }
Mansour, H., Vetro, A., "Video Background Subtraction Using Semi-supervised Robust Matrix Completion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854862, May 2014, pp. 6528-6532.
BibTeX TR2014-026 PDF
- @inproceedings{Mansour2014may,
- author = {Mansour, H. and Vetro, A.},
- title = {Video Background Subtraction Using Semi-supervised Robust Matrix Completion},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {6528--6532},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854862},
- url = {https://www.merl.com/publications/TR2014-026}
- }
Watanabe, S., Nakamura, A., Juang, B.-H., "Structural Bayesian Linear Regression for Hidden Markov Models", Journal of Signal Processing Systems, DOI: 10.1007/s11265-013-0785-8, Vol. 74, No. 3, pp. 341-358, March 2014.
BibTeX TR2013-071 PDF
- @article{Watanabe2013aug,
- author = {Watanabe, S. and Nakamura, A. and Juang, B.-H.},
- title = {Structural {Bayesian} Linear Regression for Hidden {Markov} Models},
- journal = {Journal of Signal Processing Systems},
- year = 2014,
- volume = 74,
- number = 3,
- pages = {341--358},
- month = mar,
- doi = {10.1007/s11265-013-0785-8},
- issn = {1939-8018},
- url = {https://www.merl.com/publications/TR2013-071}
- }
Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "A Generalized Discriminative Training Framework for System Combination", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707703, December 2013, pp. 43-48.
BibTeX TR2013-118 PDF
- @inproceedings{Tachioka2013dec,
- author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
- title = {A Generalized Discriminative Training Framework for System Combination},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2013,
- pages = {43--48},
- month = dec,
- doi = {10.1109/ASRU.2013.6707703},
- url = {https://www.merl.com/publications/TR2013-118}
- }
Vincent, E., Barker, J., Watanabe, S., Le Roux, J., Nesta, F., Matassoni, M., "The Second CHiME Speech Separation and Recognition Challenge: An Overview of Challenge Systems and Outcomes", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707723, December 2013, pp. 162-167.
BibTeX TR2013-119 PDF
- @inproceedings{Vincent2013dec,
- author = {Vincent, E. and Barker, J. and Watanabe, S. and {Le Roux}, J. and Nesta, F. and Matassoni, M.},
- title = {The Second {CHiME} Speech Separation and Recognition Challenge: An Overview of Challenge Systems and Outcomes},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2013,
- pages = {162--167},
- month = dec,
- doi = {10.1109/ASRU.2013.6707723},
- url = {https://www.merl.com/publications/TR2013-119}
- }
Potluru, V.K., Le Roux, J., Pearlmutter, B.A., Hershey, J.R., Brand, M., "Coordinate Descent for Mixed-norm NMF", NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective, December 2013.
BibTeX TR2013-130 PDF
- @inproceedings{Potluru2013dec,
- author = {Potluru, V. K. and {Le Roux}, J. and Pearlmutter, B. A. and Hershey, J. R. and Brand, M.},
- title = {Coordinate Descent for Mixed-norm {NMF}},
- booktitle = {NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective},
- year = 2013,
- month = dec,
- url = {https://www.merl.com/publications/TR2013-130}
- }
Le Roux, J., Watanabe, S., Hershey, J.R., "Ensemble Learning for Speech Enhancement", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701888, October 2013, pp. 1-4.
BibTeX TR2013-098 PDF
- @inproceedings{LeRoux2013oct,
- author = {{Le Roux}, J. and Watanabe, S. and Hershey, J. R.},
- title = {Ensemble Learning for Speech Enhancement},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2013,
- pages = {1--4},
- month = oct,
- doi = {10.1109/WASPAA.2013.6701888},
- issn = {1931-1168},
- url = {https://www.merl.com/publications/TR2013-098}
- }
Tawara, N., Ogawa, T., Watanabe, S., Nakamura, A., Kobayashi, T., "Blocked Gibbs Sampling Based Multi-Scale Mixture Model for Speaker Clustering on Noisy Data", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/MLSP.2013.6661902, September 2013, pp. 1-6.
BibTeX TR2013-091 PDF
- @inproceedings{Tawara2013sep,
- author = {Tawara, N. and Ogawa, T. and Watanabe, S. and Nakamura, A. and Kobayashi, T.},
- title = {Blocked {Gibbs} Sampling Based Multi-Scale Mixture Model for Speaker Clustering on Noisy Data},
- booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
- year = 2013,
- pages = {1--6},
- month = sep,
- doi = {10.1109/MLSP.2013.6661902},
- issn = {1551-2541},
- url = {https://www.merl.com/publications/TR2013-091}
- }
Tachioka, Y., Watanabe, S., "Discriminative Training of Acoustic Models for System Combination", Interspeech, August 2013.
BibTeX TR2013-074 PDF
- @inproceedings{Tachioka2013aug,
- author = {Tachioka, Y. and Watanabe, S.},
- title = {Discriminative Training of Acoustic Models for System Combination},
- booktitle = {Interspeech},
- year = 2013,
- month = aug,
- url = {https://www.merl.com/publications/TR2013-074}
- }
Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Discriminative Methods for Noise Robust Speech Recognition: A CHiME Challenge Benchmark", International Workshop on Machine Listening in Multisource Environments (CHiME), June 2013.
BibTeX TR2013-044 PDF
- @inproceedings{Tachioka2013jun,
- author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
- title = {Discriminative Methods for Noise Robust Speech Recognition: A {CHiME} Challenge Benchmark},
- booktitle = {International Workshop on Machine Listening in Multisource Environments (CHiME)},
- year = 2013,
- month = jun,
- url = {https://www.merl.com/publications/TR2013-044}
- }
Fevotte, C., Le Roux, J., Hershey, J.R., "Non-negative Dynamical System with Application to Speech and Audio", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
BibTeX TR2013-021 PDF Software
- @inproceedings{Fevotte2013may,
- author = {Fevotte, C. and {Le Roux}, J. and Hershey, J. R.},
- title = {Non-negative Dynamical System with Application to Speech and Audio},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- month = may,
- url = {https://www.merl.com/publications/TR2013-021}
- }
Garg, R., Rane, S., "A Keypoint Descriptor for Alignment-Free Fingerprint Matching", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
BibTeX TR2013-023 PDF
- @inproceedings{Garg2013may,
- author = {Garg, R. and Rane, S.},
- title = {A Keypoint Descriptor for Alignment-Free Fingerprint Matching},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- month = may,
- url = {https://www.merl.com/publications/TR2013-023}
- }