Publications

46 / 2,449 publications found.


  •  Gerkmann, T.; Krawczyk, M.; Le Roux, J., "Phase Processing for Single Channel Speech Enhancement: History and Recent Advances", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2014.2369251, ISSN: 1053-5888, Vol. 32, No. 2, pp. 55-66, March 2015.
    BibTeX Download PDFRead TR2014-122
    • @article{Gerkmann2015mar,
    • author    = {Gerkmann, T. and Krawczyk, M. and {Le Roux}, J.},
    • title     = {Phase Processing for Single Channel Speech Enhancement: History and Recent Advances},
    • journal   = {IEEE Signal Processing Magazine},
    • publisher = {IEEE},
    • volume    = {32},
    • number    = {2},
    • pages     = {55--66},
    • month     = mar,
    • year      = {2015},
    • issn      = {1053-5888},
    • doi       = {10.1109/MSP.2014.2369251},
    • url       = {http://www.merl.com/publications/TR2014-122}
    • }
  •  Weninger, F.; Le Roux, J.; Hershey, J.R.; Schuller, B., "Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation", IEEE Global Conference on Signal and Information Processing (GlobalSIP), DOI: 10.1109/GlobalSIP.2014.7032183, December 2014, pp. 577-581.
    BibTeX Download PDFRead TR2014-104
    • @inproceedings{Weninger2014dec,
    • author = {Weninger, F. and {Le Roux}, J. and Hershey, J. R. and Schuller, B.},
    • title = {Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation},
    • booktitle = {IEEE Global Conference on Signal and Information Processing (GlobalSIP)},
    • year = 2014,
    • pages = {577--581},
    • month = dec,
    • publisher = {IEEE},
    • doi = {10.1109/GlobalSIP.2014.7032183},
    • url = {http://www.merl.com/publications/TR2014-104}
    • }
  •  Tachioka, Y.; Watanabe, S.; Le Roux, J.; Hershey, J.R., "Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition", Interspeech, ISSN: 2308-457X, September 2014, vol. 15, pp. 2415-2419.
    BibTeX Download PDFRead TR2014-079
    • @inproceedings{Tachioka2014sep,
    • author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
    • title = {Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2014,
    • volume = 15,
    • pages = {2415--2419},
    • month = sep,
    • publisher = {International Speech Communication Association},
    • issn = {2308-457X},
    • url = {http://www.merl.com/publications/TR2014-079}
    • }
  •  Weninger, F.; Le Roux, J.; Hershey, J.R.; Watanabe, S., "Discriminative NMF and its application to single-channel source separation", Interspeech, ISSN: 2308-457X, September 2014, vol. 15, pp. 865-869.
    BibTeX Download PDFRead TR2014-081
    • @inproceedings{Weninger2014sep,
    • author = {Weninger, F. and {Le Roux}, J. and Hershey, J. R. and Watanabe, S.},
    • title = {Discriminative {NMF} and its application to single-channel source separation},
    • booktitle = {Interspeech},
    • year = 2014,
    • volume = 15,
    • pages = {865--869},
    • month = sep,
    • publisher = {International Speech Communication Association},
    • issn = {2308-457X},
    • url = {http://www.merl.com/publications/TR2014-081}
    • }
  •  Le Roux, J.; Vincent, E., "A Categorization of Robust Speech Processing Datasets," Tech. Rep. TR2014-116, Mitsubishi Electric Research Laboratories, September 2014.
    BibTeX Download PDFRead TR2014-116
    • @techreport{LeRouxVincent2014TRdatasets,
    • author      = {{Le Roux}, J. and Vincent, E.},
    • title       = {A Categorization of Robust Speech Processing Datasets},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address     = {Cambridge MA, USA},
    • number      = {TR2014-116},
    • month       = sep,
    • year        = {2014},
    • note        = {v2014-09},
    • url         = {http://www.merl.com/publications/TR2014-116}
    • }
  •  Hershey, J.R.; Le Roux, J.; Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures," Tech. Rep. TR2014-117, arXiv, August 2014.
    BibTeX Download PDFRead TR2014-117
    • @techreport{Hershey2014aug,
    • author = {Hershey, J. R. and {Le Roux}, J. and Weninger, F.},
    • title = {Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • number = {TR2014-117},
    • year = 2014,
    • month = aug,
    • note = {arXiv preprint},
    • url = {http://www.merl.com/publications/TR2014-117}
    • }
  •  Tachioka, Y.; Narita, T.; Watanabe, S.; Le Roux, J., "Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments", Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA), DOI: 10.1109/HSCMA.2014.6843272, May 2014, pp. 162-166.
    BibTeX Download PDFRead TR2014-034
    • @inproceedings{Tachioka2014may2,
    • author    = {Tachioka, Y. and Narita, T. and Watanabe, S. and {Le Roux}, J.},
    • title     = {Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments},
    • booktitle = {Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA)},
    • publisher = {IEEE},
    • pages     = {162--166},
    • month     = may,
    • year      = {2014},
    • doi       = {10.1109/HSCMA.2014.6843272},
    • url       = {http://www.merl.com/publications/TR2014-034}
    • }
  •  Weninger, F.; Watanabe, S.; Le Roux, J.; Hershey, J.R.; Tachioka, Y.; Geiger, J.; Schuller, B.; Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
    BibTeX Download PDFRead TR2014-033
    • @inproceedings{Weninger2014may2,
    • author = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
    • title = {The {MERL/MELCO/TUM} System for the {REVERB} Challenge Using Deep Recurrent Neural Network Feature Enhancement},
    • booktitle = {IEEE REVERB Workshop},
    • year = 2014,
    • month = may,
    • url = {http://www.merl.com/publications/TR2014-033}
    • }
  •  Simsekli, U.; Le Roux, J.; Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
    BibTeX Download PDFRead TR2014-027
    • @inproceedings{Simsekli2014may,
    • author = {Simsekli, U. and {Le Roux}, J. and Hershey, J. R.},
    • title = {Non-negative Source-filter Dynamical System for Speech Enhancement},
    • booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {6206--6210},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854797},
    • url = {http://www.merl.com/publications/TR2014-027}
    • }
  •  Watanabe, S.; Le Roux, J., "Black Box Optimization for Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854202, May 2014, pp. 3256-3260.
    BibTeX Download PDFRead TR2014-021
    • @inproceedings{Watanabe2014may,
    • author    = {Watanabe, S. and {Le Roux}, J.},
    • title     = {Black Box Optimization for Automatic Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
    • publisher = {IEEE},
    • pages     = {3256--3260},
    • month     = may,
    • year      = {2014},
    • doi       = {10.1109/ICASSP.2014.6854202},
    • url       = {http://www.merl.com/publications/TR2014-021}
    • }
  •  Tachioka, Y.; Watanabe, S.; Le Roux, J.; Hershey, J.R., "A Generalized Discriminative Training Framework for System Combination", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707703, December 2013, pp. 43-48.
    BibTeX Download PDFRead TR2013-118
    • @inproceedings{Tachioka2013dec,
    • author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
    • title = {A Generalized Discriminative Training Framework for System Combination},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2013,
    • pages = {43--48},
    • month = dec,
    • doi = {10.1109/ASRU.2013.6707703},
    • url = {http://www.merl.com/publications/TR2013-118}
    • }
  •  Vincent, E.; Barker, J.; Watanabe, S.; Le Roux, J.; Nesta, F.; Matassoni, M., "The Second CHiME Speech Separation and Recognition Challenge: An Overview of Challenge Systems and Outcomes", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707723, December 2013, pp. 162-167.
    BibTeX Download PDFRead TR2013-119
    • @inproceedings{Vincent2013dec,
    • author = {Vincent, E. and Barker, J. and Watanabe, S. and {Le Roux}, J. and Nesta, F. and Matassoni, M.},
    • title = {The Second {CHiME} Speech Separation and Recognition Challenge: An Overview of Challenge Systems and Outcomes},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2013,
    • pages = {162--167},
    • month = dec,
    • doi = {10.1109/ASRU.2013.6707723},
    • url = {http://www.merl.com/publications/TR2013-119}
    • }
  •  Potluru, V.K.; Le Roux, J.; Pearlmutter, B.A.; Hershey, J.R.; Brand, M.E., "Coordinate Descent for Mixed-norm NMF", NIPS Workshop: Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective, December 2013.
    BibTeX Download PDFRead TR2013-130
    • @inproceedings{Potluru2013dec,
    • author = {Potluru, V. K. and {Le Roux}, J. and Pearlmutter, B. A. and Hershey, J. R. and Brand, M. E.},
    • title = {Coordinate Descent for Mixed-norm {NMF}},
    • booktitle = {NIPS Workshop: Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective},
    • year = 2013,
    • month = dec,
    • url = {http://www.merl.com/publications/TR2013-130}
    • }
  •  Le Roux, J.; Watanabe, S.; Hershey, J.R., "Ensemble Learning for Speech Enhancement", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701888, ISSN: 1931-1168, October 2013, pp. 1-4.
    BibTeX Download PDFRead TR2013-098
    • @inproceedings{LeRoux2013oct,
    • author = {{Le Roux}, J. and Watanabe, S. and Hershey, J. R.},
    • title = {Ensemble Learning for Speech Enhancement},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2013,
    • pages = {1--4},
    • month = oct,
    • doi = {10.1109/WASPAA.2013.6701888},
    • issn = {1931-1168},
    • url = {http://www.merl.com/publications/TR2013-098}
    • }
  •  Simsekli, U.; Le Roux, J.; Hershey, J.R., "Hierarchical and Coupled Non-negative Dynamical Systems with Application to Audio Modeling", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701891, ISSN: 1931-1168, October 2013, pp. 1-4.
    BibTeX Download PDFRead TR2013-097
    • @inproceedings{Simsekli2013oct,
    • author = {Simsekli, U. and {Le Roux}, J. and Hershey, J. R.},
    • title = {Hierarchical and Coupled Non-negative Dynamical Systems with Application to Audio Modeling},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2013,
    • pages = {1--4},
    • month = oct,
    • doi = {10.1109/WASPAA.2013.6701891},
    • issn = {1931-1168},
    • url = {http://www.merl.com/publications/TR2013-097}
    • }
  •  Yoshino, K.; Watanabe, S.; Le Roux, J.; Hershey, J.R., "Statistical Dialogue Management using Intention Dependency Graph", International Joint Conference on Natural Language Processing (IJCNLP), October 2013.
    BibTeX Download PDFRead TR2013-096
    • @inproceedings{Yoshino2013oct,
    • author = {Yoshino, K. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
    • title = {Statistical Dialogue Management using Intention Dependency Graph},
    • booktitle = {International Joint Conference on Natural Language Processing (IJCNLP)},
    • year = 2013,
    • month = oct,
    • url = {http://www.merl.com/publications/TR2013-096}
    • }
  •  Tachioka, Y.; Watanabe, S.; Le Roux, J.; Hershey, J.R., "Discriminative Methods for Noise Robust Speech Recognition: A CHiME Challenge Benchmark", International Workshop on Machine Listening in Multisource Environments (CHiME), June 2013.
    BibTeX Download PDFRead TR2013-044
    • @inproceedings{Tachioka2013jun,
    • author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
    • title = {Discriminative Methods for Noise Robust Speech Recognition: A {CHiME} Challenge Benchmark},
    • booktitle = {International Workshop on Machine Listening in Multisource Environments (CHiME)},
    • year = 2013,
    • month = jun,
    • url = {http://www.merl.com/publications/TR2013-044}
    • }
  •  Fevotte, C.; Le Roux, J.; Hershey, J.R., "Non-negative Dynamical System with Application to Speech and Audio", IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), May 2013.
    BibTeX Download PDFRead TR2013-021
    • @inproceedings{Fevotte2013may,
    • author = {Fevotte, C. and {Le Roux}, J. and Hershey, J. R.},
    • title = {Non-negative Dynamical System with Application to Speech and Audio},
    • booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {http://www.merl.com/publications/TR2013-021}
    • }
  •  Le Roux, J.; Boufounos, P.T.; Kang, K.; Hershey, J.R., "Source Localization in Reverberant Environments using Sparse Optimization", IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6638473, ISSN: 1520-6149, May 2013, pp. 4310-4314.
    BibTeX Download PDFRead TR2013-022
    • @inproceedings{LeRoux2013may,
    • author = {{Le Roux}, J. and Boufounos, P. T. and Kang, K. and Hershey, J. R.},
    • title = {Source Localization in Reverberant Environments using Sparse Optimization},
    • booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
    • year = 2013,
    • pages = {4310--4314},
    • month = may,
    • doi = {10.1109/ICASSP.2013.6638473},
    • issn = {1520-6149},
    • url = {http://www.merl.com/publications/TR2013-022}
    • }
  •  Vincent, E.; Barker, J.; Watanabe, S.; Le Roux, J.; Nesta, F.; Matassoni, M., "The Second 'CHiME' Speech Separation and Recognition Challenge: Datasets, Tasks and Baselines", IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), May 2013.
    BibTeX Download PDFRead TR2013-079
    • @inproceedings{Vincent2013may,
    • author = {Vincent, E. and Barker, J. and Watanabe, S. and {Le Roux}, J. and Nesta, F. and Matassoni, M.},
    • title = {The Second `{CHiME}' Speech Separation and Recognition Challenge: Datasets, Tasks and Baselines},
    • booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {http://www.merl.com/publications/TR2013-079}
    • }