Publications

Gerkmann, T., Krawczyk, M., Le Roux, J., "Phase Processing for Single Channel Speech Enhancement: History and Recent Advances", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2014.2369251, Vol. 32, No. 2, pp. 55-66, March 2015.
BibTeX TR2014-122 PDF
- @article{Gerkmann2015mar,
-   author    = {Gerkmann, T. and Krawczyk, M. and {Le Roux}, J.},
-   title     = {Phase Processing for Single Channel Speech Enhancement: History and Recent Advances},
-   journal   = {IEEE Signal Processing Magazine},
-   volume    = {32},
-   number    = {2},
-   pages     = {55--66},
-   year      = {2015},
-   month     = mar,
-   publisher = {IEEE},
-   issn      = {1053-5888},
-   doi       = {10.1109/MSP.2014.2369251},
-   url       = {https://www.merl.com/publications/TR2014-122}
- }
Le Roux, J., Vincent, E., "A Categorization of Robust Speech Processing Datasets," Tech. Rep. TR2014-116, Mitsubishi Electric Research Laboratories, September 2014.
BibTeX TR2014-116 PDF
- @techreport{LeRouxVincent2014TRdatasets,
-   author      = {{Le Roux}, J. and Vincent, E.},
-   title       = {A Categorization of Robust Speech Processing Datasets},
-   institution = {Mitsubishi Electric Research Laboratories},
-   number      = {TR2014-116},
-   address     = {Cambridge MA, USA},
-   year        = {2014},
-   month       = sep,
-   note        = {v2014-09},
-   url         = {https://www.merl.com/publications/TR2014-116}
- }
Hershey, J.R., Le Roux, J., Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures", arXiv, August 2014.
BibTeX arXiv
- @article{Hershey2014aug,
- author = {Hershey, J. R. and {Le Roux}, J. and Weninger, F.},
- title = {Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures},
- journal = {arXiv},
- year = 2014,
- month = aug,
- eprint = {1409.2574},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/1409.2574v1}
- }
Tachioka, Y., Narita, T., Weninger, F., Watanabe, S., "Dual system combination approach for various reverberant environments with dereverberation techniques", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-032 PDF
- @inproceedings{Tachioka2014may,
-   author    = {Tachioka, Y. and Narita, T. and Weninger, F. and Watanabe, S.},
-   title     = {Dual system combination approach for various reverberant environments with dereverberation techniques},
-   booktitle = {IEEE REVERB Workshop},
-   month     = may,
-   year      = {2014},
-   url       = {https://www.merl.com/publications/TR2014-032}
- }
Weninger, F., Watanabe, S., Le Roux, J., Hershey, J.R., Tachioka, Y., Geiger, J., Schuller, B., Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-033 PDF
- @inproceedings{Weninger2014may2,
- author = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
- title = {The {MERL/MELCO/TUM} System for the {REVERB} Challenge Using Deep Recurrent Neural Network Feature Enhancement},
- booktitle = {IEEE REVERB Workshop},
- year = 2014,
- month = may,
- url = {https://www.merl.com/publications/TR2014-033}
- }
Simsekli, U., Le Roux, J., Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
BibTeX TR2014-027 PDF Software
- @inproceedings{Simsekli2014may,
- author = {Simsekli, U. and {Le Roux}, J. and Hershey, J. R.},
- title = {Non-negative Source-filter Dynamical System for Speech Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {6206--6210},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854797},
- url = {https://www.merl.com/publications/TR2014-027}
- }
Wang, Y., Ortega, A., Tian, D., Vetro, A., "A Graph-based Joint Bilateral Approach for Depth Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6853724, May 2014, pp. 885-889.
BibTeX TR2014-028 PDF
- @inproceedings{Wang2014may,
-   author    = {Wang, Y. and Ortega, A. and Tian, D. and Vetro, A.},
-   title     = {A Graph-based Joint Bilateral Approach for Depth Enhancement},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {885--889},
-   month     = may,
-   year      = {2014},
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP.2014.6853724},
-   url       = {https://www.merl.com/publications/TR2014-028}
- }
Le Roux, J., Watanabe, S., Hershey, J.R., "Ensemble Learning for Speech Enhancement", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701888, October 2013, pp. 1-4.
BibTeX TR2013-098 PDF
- @inproceedings{LeRoux2013oct,
- author = {{Le Roux}, J. and Watanabe, S. and Hershey, J. R.},
- title = {Ensemble Learning for Speech Enhancement},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2013,
- pages = {1--4},
- month = oct,
- doi = {10.1109/WASPAA.2013.6701888},
- issn = {1931-1168},
- url = {https://www.merl.com/publications/TR2013-098}
- }
Fevotte, C., Le Roux, J., Hershey, J.R., "Non-negative Dynamical System with Application to Speech and Audio", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
BibTeX TR2013-021 PDF Software
- @inproceedings{Fevotte2013may,
- author = {Fevotte, C. and {Le Roux}, J. and Hershey, J. R.},
- title = {Non-negative Dynamical System with Application to Speech and Audio},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- month = may,
- url = {https://www.merl.com/publications/TR2013-021}
- }
Watanabe, S., Hershey, J.R., "Stereo-based Feature Enhancement Using Dictionary Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6639034, May 2013, pp. 7073-7077.
BibTeX TR2013-019 PDF
- @inproceedings{Watanabe2013may,
- author = {Watanabe, S. and Hershey, J. R.},
- title = {Stereo-based Feature Enhancement Using Dictionary Learning},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- pages = {7073--7077},
- month = may,
- doi = {10.1109/ICASSP.2013.6639034},
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2013-019}
- }
Hershey, J.R., Rennie, S.J., Le Roux, J., "Factorial Models for Noise Robust Speech Recognition" in Techniques for Noise Robustness in Automatic Speech Recognition, Virtanen, T., Singh, R., and Raj, B., Eds., chapter 12, Wiley, November 2012.
BibTeX TR2012-002 PDF
- @incollection{Hershey2012nov,
- author = {Hershey, J. R. and Rennie, S. J. and {Le Roux}, J.},
- title = {Factorial Models for Noise Robust Speech Recognition},
- booktitle = {Techniques for Noise Robustness in Automatic Speech Recognition},
- year = 2012,
- editor = {Virtanen, T. and Singh, R. and Raj, B.},
- chapter = 12,
- month = nov,
- publisher = {Wiley},
- url = {https://www.merl.com/publications/TR2012-002}
- }
Le Roux, J., Hershey, J.R., "Indirect Model-based Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2012.6288806, March 2012, pp. 4045-4048.
BibTeX TR2012-016 PDF
- @inproceedings{LeRoux2012mar2,
- author = {{Le Roux}, J. and Hershey, J. R.},
- title = {Indirect Model-based Speech Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2012,
- pages = {4045--4048},
- month = mar,
- doi = {10.1109/ICASSP.2012.6288806},
- issn = {1520-6149},
- isbn = {978-1-4673-0045-2},
- url = {https://www.merl.com/publications/TR2012-016}
- }
Le Roux, J., Hershey, J.R., "Speech Enhancement by Indirect VTS", Acoustical Society of Japan Spring Meeting (ASJ), March 2012.
BibTeX TR2012-011 PDF
- @inproceedings{LeRoux2012mar1,
- author = {{Le Roux}, J. and Hershey, J. R.},
- title = {Speech Enhancement by Indirect {VTS}},
- booktitle = {Acoustical Society of Japan Spring Meeting (ASJ)},
- year = 2012,
- month = mar,
- url = {https://www.merl.com/publications/TR2012-011}
- }
Boufounos, P.T., "Compressive Sensing for Over-the-Air Ultrasound", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2011.5947722, May 2011, pp. 5972-5975.
BibTeX TR2011-016 PDF Video
- @inproceedings{Boufounos2011may1,
- author = {Boufounos, P. T.},
- title = {Compressive Sensing for Over-the-Air Ultrasound},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2011,
- pages = {5972--5975},
- month = may,
- doi = {10.1109/ICASSP.2011.5947722},
- url = {https://www.merl.com/publications/TR2011-016}
- }
Varna, A.L., Rane, S., Vetro, A., "Data Hiding in Hard-Copy Text Documents Robust to Print, Scan and Photocopy Operations", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2009.
BibTeX TR2009-020 PDF
- @inproceedings{Varna2009apr,
- author = {Varna, A. L. and Rane, S. and Vetro, A.},
- title = {Data Hiding in Hard-Copy Text Documents Robust to Print, Scan and Photocopy Operations},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2009,
- month = apr,
- url = {https://www.merl.com/publications/TR2009-020}
- }
Raj, B., Singh, R., Smaragdis, P., "Recognizing Speech from Simultaneous Speakers", Eurospeech, September 2005.
BibTeX TR2005-136 PDF
- @inproceedings{Raj2005sep,
-   author    = {Raj, B. and Singh, R. and Smaragdis, P.},
-   title     = {Recognizing Speech from Simultaneous Speakers},
-   booktitle = {Eurospeech},
-   month     = sep,
-   year      = {2005},
-   url       = {https://www.merl.com/publications/TR2005-136}
- }
Divakaran, A., Otsuka, I., Radhakrishnan, R., Nakane, K., Ogawa, M., "Audio-Assisted Video Browsing for DVD Recorders", IEEE Pacific-Rim Conference on Multimedia (PCM), November 2004.
BibTeX TR2004-139 PDF
- @inproceedings{Divakaran2004nov,
- author = {Divakaran, A. and Otsuka, I. and Radhakrishnan, R. and Nakane, K. and Ogawa, M.},
- title = {Audio-Assisted Video Browsing for {DVD} Recorders},
- booktitle = {IEEE Pacific-Rim Conference on Multimedia (PCM)},
- year = 2004,
- month = nov,
- url = {https://www.merl.com/publications/TR2004-139}
- }
Seltzer, M.L., Raj, B., Stern, R.M., "Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition", IEEE Transactions on Speech and Audio Processing, Vol. 12, No. 5, pp. 489-498, September 2004.
BibTeX TR2004-088 PDF
- @article{Seltzer2004sep1,
- author = {Seltzer, M. L. and Raj, B. and Stern, R. M.},
- title = {Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition},
- journal = {IEEE Transactions on Speech and Audio Processing},
- year = 2004,
- volume = 12,
- number = 5,
- pages = {489--498},
- month = sep,
- note = {Awarded Best Young Author, March 2007},
- issn = {1063-6676},
- url = {https://www.merl.com/publications/TR2004-088}
- }
Raj, B., Seltzer, M.L., Reyes-Gomez, M.J., "Speech Recognizer Based Maximum Likelihood Beamforming", NSF Workshop on Perspectives on Speech Separation, October 2003.
BibTeX TR2003-87 PDF
- @inproceedings{Raj2003oct,
- author = {Raj, B. and Seltzer, M. L. and Reyes-Gomez, M. J.},
- title = {Speech Recognizer Based Maximum Likelihood Beamforming},
- booktitle = {NSF Workshop on Perspectives on Speech Separation},
- year = 2003,
- month = oct,
- url = {https://www.merl.com/publications/TR2003-87}
- }