Publications

235 / 3,841 publications found.


  •  Le Roux, J., Boufounos, P.T., Kang, K., Hershey, J.R., "Source Localization in Reverberant Environments using Sparse Optimization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6638473, May 2013, pp. 4310-4314.
    BibTeX TR2013-022 PDF
    • @inproceedings{LeRoux2013may,
    • author = {{Le Roux}, J. and Boufounos, P.T. and Kang, K. and Hershey, J.R.},
    • title = {{Source Localization in Reverberant Environments using Sparse Optimization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • pages = {4310--4314},
    • month = may,
    • doi = {10.1109/ICASSP.2013.6638473},
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2013-022}
    • }
  •  Tachioka, Y., Watanabe, S., Hershey, J.R., "Effectiveness of Discriminative Training and Feature Transformation for Reverberated and Noisy Speech", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
    BibTeX TR2013-020 PDF
    • @inproceedings{Tachioka2013may,
    • author = {Tachioka, Y. and Watanabe, S. and Hershey, J.R.},
    • title = {{Effectiveness of Discriminative Training and Feature Transformation for Reverberated and Noisy Speech}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-020}
    • }
  •  Vincent, E., Barker, J., Watanabe, S., Le Roux, J., Nesta, F., Matassoni, M., "The Second 'CHiME' Speech Separation and Recognition Challenge: Datasets, Tasks and Baselines", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
    BibTeX TR2013-079 PDF
    • @inproceedings{Vincent2013may,
    • author = {Vincent, E. and Barker, J. and Watanabe, S. and {Le Roux}, J. and Nesta, F. and Matassoni, M.},
    • title = {{The Second 'CHiME' Speech Separation and Recognition Challenge: Datasets, Tasks and Baselines}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-079}
    • }
  •  Watanabe, S., Hershey, J.R., "Stereo-based Feature Enhancement Using Dictionary Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6639034, May 2013, pp. 7073-7077.
    BibTeX TR2013-019 PDF
    • @inproceedings{Watanabe2013may,
    • author = {Watanabe, S. and Hershey, J.R.},
    • title = {{Stereo-based Feature Enhancement Using Dictionary Learning}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • pages = {7073--7077},
    • month = may,
    • doi = {10.1109/ICASSP.2013.6639034},
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2013-019}
    • }
  •  Potluru, V.K., Plis, S.M., Le Roux, J., Pearlmutter, B.A., Calhoun, V.D., Hayes, T.P., "Block Coordinate Descent for Sparse NMF", International Conference on Learning Representations (ICLR), May 2013.
    BibTeX TR2013-026 PDF
    • @inproceedings{Potluru2013may,
    • author = {Potluru, V.K. and Plis, S.M. and {Le Roux}, J. and Pearlmutter, B.A. and Calhoun, V.D. and Hayes, T.P.},
    • title = {{Block Coordinate Descent for Sparse NMF}},
    • booktitle = {International Conference on Learning Representations (ICLR)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-026}
    • }
  •  Le Roux, J., Vincent, E., "Consistent Wiener Filtering for Audio Source Separation", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2012.2225617, Vol. 20, No. 3, pp. 217-220, March 2013.
    BibTeX TR2012-090 PDF
    • @article{LeRoux2013mar,
    • author = {{Le Roux}, J. and Vincent, E.},
    • title = {{Consistent Wiener Filtering for Audio Source Separation}},
    • journal = {IEEE Signal Processing Letters},
    • year = 2013,
    • volume = 20,
    • number = 3,
    • pages = {217--220},
    • month = mar,
    • doi = {10.1109/LSP.2012.2225617},
    • url = {https://www.merl.com/publications/TR2012-090}
    • }
  •  Watanabe, S., Nakamura, A., "Bayesian Approaches to Acoustic Modeling: A Review", APSIPA Transactions on Signal and Information Processing, DOI: 10.1017/ATSIP.2012.6, Vol. 1, December 2012.
    BibTeX TR2012-087 PDF
    • @article{Watanabe2012dec,
    • author = {Watanabe, S. and Nakamura, A.},
    • title = {{Bayesian Approaches to Acoustic Modeling: A Review}},
    • journal = {APSIPA Transactions on Signal and Information Processing},
    • year = 2012,
    • volume = 1,
    • month = dec,
    • doi = {10.1017/ATSIP.2012.6},
    • url = {https://www.merl.com/publications/TR2012-087}
    • }
  •  Hershey, J.R., Rennie, S.J., Le Roux, J., "Factorial Models for Noise Robust Speech Recognition" in Techniques for Noise Robustness in Automatic Speech Recognition, Virtanen, T. and Singh, R. and Raj, B., Eds., chapter 12, Wiley, November 2012.
    BibTeX TR2012-002 PDF
    • @incollection{Hershey2012nov,
    • author = {Hershey, J.R. and Rennie, S.J. and {Le Roux}, J.},
    • title = {{Factorial Models for Noise Robust Speech Recognition}},
    • booktitle = {Techniques for Noise Robustness in Automatic Speech Recognition},
    • year = 2012,
    • editor = {Virtanen, T. and Singh, R. and Raj, B.},
    • chapter = 12,
    • month = nov,
    • publisher = {Wiley},
    • url = {https://www.merl.com/publications/TR2012-002}
    • }
  •  Gales, M., Watanabe, S., Fosler-Lussier, E., "Structured Discriminative Models For Speech Recognition", IEEE Signal Processing Magazine, Vol. 29, No. 6, pp. 70-81, November 2012.
    BibTeX TR2012-072 PDF
    • @article{Gales2012nov,
    • author = {Gales, M. and Watanabe, S. and Fosler-Lussier, E.},
    • title = {{Structured Discriminative Models For Speech Recognition}},
    • journal = {IEEE Signal Processing Magazine},
    • year = 2012,
    • volume = 29,
    • number = 6,
    • pages = {70--81},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2012-072}
    • }
  •  Zhang, J., Borowsky, A., Schmidt-Nielsen, B., Harsham, B., Weinberg, G., Romoser, M.R.E., Fisher, D.L., "Evaluation of Two Types of In-Vehicle Music Retrieval and Navigation Systems", Annual Meeting of the Human Factors and Ergonomics Society (HFES), October 2012.
    BibTeX TR2012-097 PDF
    • @inproceedings{Zhang2012oct,
    • author = {Zhang, J. and Borowsky, A. and Schmidt-Nielsen, B. and Harsham, B. and Weinberg, G. and Romoser, M.R.E. and Fisher, D.L.},
    • title = {{Evaluation of Two Types of In-Vehicle Music Retrieval and Navigation Systems}},
    • booktitle = {Annual Meeting of the Human Factors and Ergonomics Society (HFES)},
    • year = 2012,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2012-097}
    • }
  •  Heaukulani, C., Le Roux, J., Hershey, J.R., "Latent Dirichlet Reallocation for Term Swapping", International Workshop on Statistical Machine Learning for Speech Processing (IWSML), March 2012.
    BibTeX TR2012-022 PDF
    • @inproceedings{Heaukulani2012mar,
    • author = {Heaukulani, C. and {Le Roux}, J. and Hershey, J.R.},
    • title = {{Latent Dirichlet Reallocation for Term Swapping}},
    • booktitle = {International Workshop on Statistical Machine Learning for Speech Processing (IWSML)},
    • year = 2012,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2012-022}
    • }
  •  Le Roux, J., Hershey, J.R., "Indirect Model-based Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2012.6288806, March 2012, pp. 4045-4048.
    BibTeX TR2012-016 PDF
    • @inproceedings{LeRoux2012mar2,
    • author = {{Le Roux}, J. and Hershey, J.R.},
    • title = {{Indirect Model-based Speech Enhancement}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2012,
    • pages = {4045--4048},
    • month = mar,
    • doi = {10.1109/ICASSP.2012.6288806},
    • issn = {1520-6149},
    • isbn = {978-1-4673-0045-2},
    • url = {https://www.merl.com/publications/TR2012-016}
    • }
  •  Le Roux, J., Hershey, J.R., "Speech Enhancement by Indirect VTS", Acoustical Society of Japan Spring Meeting (ASJ), March 2012.
    BibTeX TR2012-011 PDF
    • @inproceedings{LeRoux2012mar1,
    • author = {{Le Roux}, J. and Hershey, J.R.},
    • title = {{Speech Enhancement by Indirect VTS}},
    • booktitle = {Acoustical Society of Japan Spring Meeting (ASJ)},
    • year = 2012,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2012-011}
    • }
  •  Weinberg, G., Harsham, B., Medenica, Z., "Investigating HUDs for the Presentation of Choice Lists in Car Navigation Systems", International Driving Symposium on Human Factors in Driver Assessment, Training and Vehicle Design, June 2011.
    BibTeX TR2011-060 PDF
    • @inproceedings{Weinberg2011jun,
    • author = {Weinberg, G. and Harsham, B. and Medenica, Z.},
    • title = {{Investigating HUDs for the Presentation of Choice Lists in Car Navigation Systems}},
    • booktitle = {International Driving Symposium on Human Factors in Driver Assessment, Training and Vehicle Design},
    • year = 2011,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2011-060}
    • }
  •  Mueller, C., Weinberg, G., "Multimodal Input in the Car, Today and Tomorrow", IEEE Multimedia, Vol. 18, No. 1, pp. 98-103, January 2011.
    BibTeX TR2011-002 PDF
    • @article{Mueller2011jan,
    • author = {Mueller, C. and Weinberg, G.},
    • title = {{Multimodal Input in the Car, Today and Tomorrow}},
    • journal = {IEEE Multimedia},
    • year = 2011,
    • volume = 18,
    • number = 1,
    • pages = {98--103},
    • month = jan,
    • issn = {1070-986X},
    • url = {https://www.merl.com/publications/TR2011-002}
    • }
  •  Gouvea, E., Ezzat, T., "Vocabulary Independent Spoken Query: a Case for Subword Units", Interspeech, September 2010.
    BibTeX TR2010-089 PDF
    • @inproceedings{Gouvea2010sep,
    • author = {Gouvea, E. and Ezzat, T.},
    • title = {{Vocabulary Independent Spoken Query: a Case for Subword Units}},
    • booktitle = {Interspeech},
    • year = 2010,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2010-089}
    • }
  •  Raj, B., Wilson, K.W., Krueger, A., Haeb-Umbach, R., "Ungrounded Independent Non-Negative Factor Analysis", Interspeech, September 2010, pp. 330-333.
    BibTeX TR2010-122 PDF
    • @inproceedings{Raj2010sep,
    • author = {Raj, B. and Wilson, K.W. and Krueger, A. and Haeb-Umbach, R.},
    • title = {{Ungrounded Independent Non-Negative Factor Analysis}},
    • booktitle = {Interspeech},
    • year = 2010,
    • pages = {330--333},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2010-122}
    • }
  •  Weinberg, G., Harsham, B., Forlines, C., Medenica, Z., "Contextual Push-to-talk: Shortening Voice Dialogs to Improve Driving Performance", International Conference on Human-Computer Interaction with Mobile Devices and Services (MobileHCI), September 2010, pp. 113-122.
    BibTeX TR2010-085 PDF
    • @inproceedings{Weinberg2010sep1,
    • author = {Weinberg, G. and Harsham, B. and Forlines, C. and Medenica, Z.},
    • title = {{Contextual Push-to-talk: Shortening Voice Dialogs to Improve Driving Performance}},
    • booktitle = {International Conference on Human-Computer Interaction with Mobile Devices and Services (MobileHCI)},
    • year = 2010,
    • pages = {113--122},
    • month = sep,
    • isbn = {978-1-60558-835-3},
    • url = {https://www.merl.com/publications/TR2010-085}
    • }
  •  Weinberg, G., Harsham, B., "Object-Oriented Multimodality for Safer In-Vehicle Interfaces", Speech in Mobile and Pervasive Environments (SiMPE), September 2010.
    BibTeX TR2010-084 PDF
    • @inproceedings{Weinberg2010sep2,
    • author = {Weinberg, G. and Harsham, B.},
    • title = {{Object-Oriented Multimodality for Safer In-Vehicle Interfaces}},
    • booktitle = {Speech in Mobile and Pervasive Environments (SiMPE)},
    • year = 2010,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2010-084}
    • }
  •  Garay-Vega, L., Pradhan, A.K., Weinberg, G.L., Schmidt-Nielsen, B.K., Harsham, B.A., Shen, Y., Divekar, G., Romoser, M., Knodler, M., Fisher, D.L., "Evaluation of Different Speech and Touch Interfaces to In-vehicle Music Retrieval Systems", Accident Analysis & Prevention, Vol. 42, No. 3, May 2010.
    BibTeX TR2010-025 PDF
    • @article{Garay-Vega2010may,
    • author = {Garay-Vega, L. and Pradhan, A.K. and Weinberg, G.L. and Schmidt-Nielsen, B.K. and Harsham, B.A. and Shen, Y. and Divekar, G. and Romoser, M. and Knodler, M. and Fisher, D.L.},
    • title = {{Evaluation of Different Speech and Touch Interfaces to In-vehicle Music Retrieval Systems}},
    • journal = {Accident Analysis \& Prevention},
    • year = 2010,
    • volume = 42,
    • number = 3,
    • month = may,
    • issn = {0001-4575},
    • url = {https://www.merl.com/publications/TR2010-025}
    • }
  •  Gouvea, E., Ezzat, T., Raj, B., "Subword Unit Approaches for Retrieval by Voice", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2010.
    BibTeX TR2010-012 PDF
    • @inproceedings{Gouvea2010mar,
    • author = {Gouvea, E. and Ezzat, T. and Raj, B.},
    • title = {{Subword Unit Approaches for Retrieval by Voice}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2010,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2010-012}
    • }
  •  Srinivasan, S., Raj, B., Ezzat, T., "Ultrasonic Sensing for Robust Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2010.
    BibTeX TR2010-015 PDF
    • @inproceedings{Srinivasan2010mar,
    • author = {Srinivasan, S. and Raj, B. and Ezzat, T.},
    • title = {{Ultrasonic Sensing for Robust Speech Recognition}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2010,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2010-015}
    • }
  •  Toth, A.R., Raj, B., Kalgaonkar, K., Ezzat, T., "Synthesizing Speech from Doppler Signals", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2010.
    BibTeX TR2010-016 PDF
    • @inproceedings{Toth2010mar,
    • author = {Toth, A.R. and Raj, B. and Kalgaonkar, K. and Ezzat, T.},
    • title = {{Synthesizing Speech from Doppler Signals}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2010,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2010-016}
    • }
  •  Wilson, K.W., Raj, B., "Spectrogram Dimensionality Reduction with Independence Constraints", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2010.
    BibTeX TR2010-023 PDF
    • @inproceedings{Wilson2010mar,
    • author = {Wilson, K.W. and Raj, B.},
    • title = {{Spectrogram Dimensionality Reduction with Independence Constraints}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2010,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2010-023}
    • }
  •  Weinberg, G.L., Harsham, B.A., "Developing a Low-Cost Driving Simulator for the Evaluation of In-Vehicle Technologies", International Conference on Automotive User Interfaces and Interactive Vehicular Applications (AutomotiveUI), September 2009, pp. 51-54.
    BibTeX TR2009-064 PDF
    • @inproceedings{Weinberg2009sep1,
    • author = {Weinberg, G.L. and Harsham, B.A.},
    • title = {{Developing a Low-Cost Driving Simulator for the Evaluation of In-Vehicle Technologies}},
    • booktitle = {International Conference on Automotive User Interfaces and Interactive Vehicular Applications (AutomotiveUI)},
    • year = 2009,
    • pages = {51--54},
    • month = sep,
    • isbn = {978-1-60558-571-0},
    • url = {https://www.merl.com/publications/TR2009-064}
    • }