Publications

378 / 3,813 publications found.


  •  Weninger, F., Le Roux, J., Hershey, J.R., Schuller, B., "Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation", IEEE Global Conference on Signal and Information Processing (GlobalSIP), DOI: 10.1109/GlobalSIP.2014.7032183, December 2014, pp. 577-581.
    BibTeX TR2014-104 PDF
    • @inproceedings{Weninger2014dec,
    • author = {Weninger, F. and {Le Roux}, J. and Hershey, J.R. and Schuller, B.},
    • title = {{Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation}},
    • booktitle = {IEEE Global Conference on Signal and Information Processing (GlobalSIP)},
    • year = 2014,
    • pages = {577--581},
    • month = dec,
    • publisher = {IEEE},
    • doi = {10.1109/GlobalSIP.2014.7032183},
    • url = {https://www.merl.com/publications/TR2014-104}
    • }
  •  Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition", Interspeech, September 2014, vol. 15, pp. 2415-2419.
    BibTeX TR2014-079 PDF
    • @inproceedings{Tachioka2014sep,
    • author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
    • title = {{Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition}},
    • booktitle = {Interspeech},
    • year = 2014,
    • volume = 15,
    • pages = {2415--2419},
    • month = sep,
    • publisher = {International Speech Communication Association},
    • issn = {2308-457X},
    • url = {https://www.merl.com/publications/TR2014-079}
    • }
  •  Watanabe, S., Hershey, J.R., Marks, T.K., Fujii, Y., Koji, Y., "Cost-level integration of statistical and rule-based dialog managers", Interspeech, September 2014, vol. 15, pp. 323-327.
    BibTeX TR2014-082 PDF
    • @inproceedings{Watanabe2014sep,
    • author = {Watanabe, S. and Hershey, J.R. and Marks, T.K. and Fujii, Y. and Koji, Y.},
    • title = {{Cost-level integration of statistical and rule-based dialog managers}},
    • booktitle = {Interspeech},
    • year = 2014,
    • volume = 15,
    • pages = {323--327},
    • month = sep,
    • publisher = {International Speech Communication Association},
    • url = {https://www.merl.com/publications/TR2014-082}
    • }
  •  Weninger, F., Le Roux, J., Hershey, J.R., Watanabe, S., "Discriminative NMF and its application to single-channel source separation", Interspeech, September 2014, vol. 15, pp. 865-869.
    BibTeX TR2014-081 PDF
    • @inproceedings{Weninger2014sep,
    • author = {Weninger, F. and {Le Roux}, J. and Hershey, J.R. and Watanabe, S.},
    • title = {{Discriminative NMF and its application to single-channel source separation}},
    • booktitle = {Interspeech},
    • year = 2014,
    • volume = 15,
    • pages = {865--869},
    • month = sep,
    • publisher = {International Speech Communication Association},
    • issn = {2308-457X},
    • url = {https://www.merl.com/publications/TR2014-081}
    • }
  •  Le Roux, J., Vincent, E., "A Categorization of Robust Speech Processing Datasets," Tech. Rep. TR2014-116, Mitsubishi Electric Research Laboratories, September 2014.
    BibTeX TR2014-116 PDF
    • @techreport{LeRouxVincent2014TRdatasets,
    • author = {{Le Roux}, J. and Vincent, E.},
    • title = {{A Categorization of Robust Speech Processing Datasets}},
    • institution = {Mitsubishi Electric Research Laboratories},
    • year = 2014,
    • number = {TR2014-116},
    • address = {Cambridge MA, USA},
    • month = sep,
    • note = {v2014-09},
    • url = {https://www.merl.com/publications/TR2014-116}
    • }
  •  Hershey, J.R., Le Roux, J., Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures", arXiv, August 2014.
    BibTeX arXiv
    • @article{Hershey2014aug,
    • author = {Hershey, J.R. and {Le Roux}, J. and Weninger, F.},
    • title = {{Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures}},
    • journal = {arXiv},
    • year = 2014,
    • month = aug,
    • url = {https://arxiv.org/abs/1409.2574}
    • }
  •  Tachioka, Y., Narita, T., Watanabe, S., Le Roux, J., "Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments", Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA), DOI: 10.1109/HSCMA.2014.6843272, May 2014, pp. 162-166.
    BibTeX TR2014-034 PDF
    • @inproceedings{Tachioka2014may2,
    • author = {Tachioka, Y. and Narita, T. and Watanabe, S. and {Le Roux}, J.},
    • title = {{Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments}},
    • booktitle = {Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA)},
    • year = 2014,
    • pages = {162--166},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/HSCMA.2014.6843272},
    • url = {https://www.merl.com/publications/TR2014-034}
    • }
  •  Tachioka, Y., Narita, T., Weninger, F., Watanabe, S., "Dual system combination approach for various reverberant environments with dereverberation techniques", IEEE REVERB Workshop, May 2014.
    BibTeX TR2014-032 PDF
    • @inproceedings{Tachioka2014may,
    • author = {Tachioka, Y. and Narita, T. and Weninger, F. and Watanabe, S.},
    • title = {{Dual system combination approach for various reverberant environments with dereverberation techniques}},
    • booktitle = {IEEE REVERB Workshop},
    • year = 2014,
    • month = may,
    • url = {https://www.merl.com/publications/TR2014-032}
    • }
  •  Weninger, F., Watanabe, S., Le Roux, J., Hershey, J.R., Tachioka, Y., Geiger, J., Schuller, B., Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
    BibTeX TR2014-033 PDF
    • @inproceedings{Weninger2014may2,
    • author = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
    • title = {{The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement}},
    • booktitle = {IEEE REVERB Workshop},
    • year = 2014,
    • month = may,
    • url = {https://www.merl.com/publications/TR2014-033}
    • }
  •  Naini, R., Rane, S., Ramalingam, S., "A Vanishing Point-based Global Descriptor for Manhattan Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854423, May 2014, pp. 4349-4353.
    BibTeX TR2014-029 PDF
    • @inproceedings{Naini2014may,
    • author = {Naini, R. and Rane, S. and Ramalingam, S.},
    • title = {{A Vanishing Point-based Global Descriptor for Manhattan Scenes}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {4349--4353},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854423},
    • url = {https://www.merl.com/publications/TR2014-029}
    • }
  •  Simsekli, U., Le Roux, J., Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
    BibTeX TR2014-027 PDF Software
    • @inproceedings{Simsekli2014may,
    • author = {Simsekli, U. and {Le Roux}, J. and Hershey, J.R.},
    • title = {{Non-negative Source-filter Dynamical System for Speech Enhancement}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {6206--6210},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854797},
    • url = {https://www.merl.com/publications/TR2014-027}
    • }
  •  Tang, H., Watanabe, S., Marks, T.K., Hershey, J.R., "Log-linear Dialog Manager", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854371, May 2014, pp. 4092-4096.
    BibTeX TR2014-024 PDF
    • @inproceedings{Tang2014may,
    • author = {Tang, H. and Watanabe, S. and Marks, T.K. and Hershey, J.R.},
    • title = {{Log-linear Dialog Manager}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {4092--4096},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854371},
    • url = {https://www.merl.com/publications/TR2014-024}
    • }
  •  Wang, Y., Ortega, A., Tian, D., Vetro, A., "A Graph-based Joint Bilateral Approach for Depth Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6853724, May 2014, pp. 885-889.
    BibTeX TR2014-028 PDF
    • @inproceedings{Wang2014may,
    • author = {Wang, Y. and Ortega, A. and Tian, D. and Vetro, A.},
    • title = {{A Graph-based Joint Bilateral Approach for Depth Enhancement}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {885--889},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6853724},
    • url = {https://www.merl.com/publications/TR2014-028}
    • }
  •  Watanabe, S., Le Roux, J., "Black Box Optimization for Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854202, May 2014, pp. 3256-3260.
    BibTeX TR2014-021 PDF
    • @inproceedings{Watanabe2014may,
    • author = {Watanabe, S. and {Le Roux}, J.},
    • title = {{Black Box Optimization for Automatic Speech Recognition}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {3256--3260},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854202},
    • url = {https://www.merl.com/publications/TR2014-021}
    • }
  •  Weng, C., Yu, D., Watanabe, S., Juang, B.-H.F., "Recurrent Deep Neural Networks for Robust Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854661, May 2014, pp. 5532-5536.
    BibTeX TR2014-023 PDF
    • @inproceedings{Weng2014may,
    • author = {Weng, C. and Yu, D. and Watanabe, S. and Juang, B.-H.F.},
    • title = {{Recurrent Deep Neural Networks for Robust Speech Recognition}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {5532--5536},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854661},
    • url = {https://www.merl.com/publications/TR2014-023}
    • }
  •  Weninger, F., Watanabe, S., Tachioka, Y., Schuller, B., "Deep Recurrent De-noising Auto-encoder and Blind De-reverberation for Reverberated Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854478, May 2014, pp. 4623-4627.
    BibTeX TR2014-022 PDF
    • @inproceedings{Weninger2014may1,
    • author = {Weninger, F. and Watanabe, S. and Tachioka, Y. and Schuller, B.},
    • title = {{Deep Recurrent De-noising Auto-encoder and Blind De-reverberation for Reverberated Speech Recognition}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {4623--4627},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854478},
    • url = {https://www.merl.com/publications/TR2014-022}
    • }
  •  Zhang, J., Chen, L., Boufounos, P.T., Gu, Y., "On the Theoretical Analysis of Cross Validation in Compressive Sensing", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854225, May 2014, pp. 3370-3374.
    BibTeX TR2014-025 PDF
    • @inproceedings{Zhang2014may,
    • author = {Zhang, J. and Chen, L. and Boufounos, P.T. and Gu, Y.},
    • title = {{On the Theoretical Analysis of Cross Validation in Compressive Sensing}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {3370--3374},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854225},
    • url = {https://www.merl.com/publications/TR2014-025}
    • }
  •  Mansour, H., Vetro, A., "Video Background Subtraction Using Semi-supervised Robust Matrix Completion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854862, May 2014, pp. 6528-6532.
    BibTeX TR2014-026 PDF
    • @inproceedings{Mansour2014may,
    • author = {Mansour, H. and Vetro, A.},
    • title = {{Video Background Subtraction Using Semi-supervised Robust Matrix Completion}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2014,
    • pages = {6528--6532},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP.2014.6854862},
    • url = {https://www.merl.com/publications/TR2014-026}
    • }
  •  Watanabe, S., Nakamura, A., Juang, B.-H., "Structural Bayesian Linear Regression for Hidden Markov Models", Journal of Signal Processing Systems, DOI: 10.1007/s11265-013-0785-8, Vol. 74, No. 3, pp. 341-358, March 2014.
    BibTeX TR2013-071 PDF
    • @article{Watanabe2013aug,
    • author = {Watanabe, S. and Nakamura, A. and Juang, B.-H.},
    • title = {{Structural Bayesian Linear Regression for Hidden Markov Models}},
    • journal = {Journal of Signal Processing Systems},
    • year = 2014,
    • volume = 74,
    • number = 3,
    • pages = {341--358},
    • month = mar,
    • doi = {10.1007/s11265-013-0785-8},
    • issn = {1939-8018},
    • url = {https://www.merl.com/publications/TR2013-071}
    • }
  •  Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "A Generalized Discriminative Training Framework for System Combination", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707703, December 2013, pp. 43-48.
    BibTeX TR2013-118 PDF
    • @inproceedings{Tachioka2013dec,
    • author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
    • title = {{A Generalized Discriminative Training Framework for System Combination}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2013,
    • pages = {43--48},
    • month = dec,
    • doi = {10.1109/ASRU.2013.6707703},
    • url = {https://www.merl.com/publications/TR2013-118}
    • }
  •  Vincent, E., Barker, J., Watanabe, S., Le Roux, J., Nesta, F., Matassoni, M., "The Second CHiME Speech Separation and Recognition Challenge: An Overview of Challenge Systems and Outcomes", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707723, December 2013, pp. 162-167.
    BibTeX TR2013-119 PDF
    • @inproceedings{Vincent2013dec,
    • author = {Vincent, E. and Barker, J. and Watanabe, S. and {Le Roux}, J. and Nesta, F. and Matassoni, M.},
    • title = {{The Second CHiME Speech Separation and Recognition Challenge: An Overview of Challenge Systems and Outcomes}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2013,
    • pages = {162--167},
    • month = dec,
    • doi = {10.1109/ASRU.2013.6707723},
    • url = {https://www.merl.com/publications/TR2013-119}
    • }
  •  Potluru, V.K., Le Roux, J., Pearlmutter, B.A., Hershey, J.R., Brand, M., "Coordinate Descent for Mixed-norm NMF", NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective, December 2013.
    BibTeX TR2013-130 PDF
    • @inproceedings{Potluru2013dec,
    • author = {Potluru, V.K. and {Le Roux}, J. and Pearlmutter, B.A. and Hershey, J.R. and Brand, M.},
    • title = {{Coordinate Descent for Mixed-norm NMF}},
    • booktitle = {NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective},
    • year = 2013,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2013-130}
    • }
  •  Le Roux, J., Watanabe, S., Hershey, J.R., "Ensemble Learning for Speech Enhancement", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701888, October 2013, pp. 1-4.
    BibTeX TR2013-098 PDF
    • @inproceedings{LeRoux2013oct,
    • author = {{Le Roux}, J. and Watanabe, S. and Hershey, J.R.},
    • title = {{Ensemble Learning for Speech Enhancement}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2013,
    • pages = {1--4},
    • month = oct,
    • doi = {10.1109/WASPAA.2013.6701888},
    • issn = {1931-1168},
    • url = {https://www.merl.com/publications/TR2013-098}
    • }
  •  Tawara, N., Ogawa, T., Watanabe, S., Nakamura, A., Kobayashi, T., "Blocked Gibbs Sampling Based Multi-Scale Mixture Model for Speaker Clustering on Noisy Data", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/MLSP.2013.6661902, September 2013, pp. 1-6.
    BibTeX TR2013-091 PDF
    • @inproceedings{Tawara2013sep,
    • author = {Tawara, N. and Ogawa, T. and Watanabe, S. and Nakamura, A. and Kobayashi, T.},
    • title = {{Blocked Gibbs Sampling Based Multi-Scale Mixture Model for Speaker Clustering on Noisy Data}},
    • booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
    • year = 2013,
    • pages = {1--6},
    • month = sep,
    • doi = {10.1109/MLSP.2013.6661902},
    • issn = {1551-2541},
    • url = {https://www.merl.com/publications/TR2013-091}
    • }
  •  Tachioka, Y., Watanabe, S., "Discriminative Training of Acoustic Models for System Combination", Interspeech, August 2013.
    BibTeX TR2013-074 PDF
    • @inproceedings{Tachioka2013aug,
    • author = {Tachioka, Y. and Watanabe, S.},
    • title = {{Discriminative Training of Acoustic Models for System Combination}},
    • booktitle = {Interspeech},
    • year = 2013,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2013-074}
    • }