Publications

315 / 3,608 publications found.


  •  Potluru, V.K., Le Roux, J., Pearlmutter, B.A., Hershey, J.R., Brand, M., "Coordinate Descent for Mixed-norm NMF", NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective, December 2013.
    BibTeX TR2013-130 PDF
    • @inproceedings{Potluru2013dec,
    • author = {Potluru, V.K. and {Le Roux}, J. and Pearlmutter, B.A. and Hershey, J.R. and Brand, M.},
    • title = {Coordinate Descent for Mixed-norm NMF},
    • booktitle = {NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective},
    • year = 2013,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2013-130}
    • }
  •  Portelo, J., Raj, B., Boufounos, P., Trancoso, I., Abad, A., "Speaker Verification Using Secure Binary Embeddings", European Signal Processing Conference (EUSIPCO), September 2013.
    BibTeX TR2013-082 PDF
    • @inproceedings{Portelo2013sep,
    • author = {Portelo, J. and Raj, B. and Boufounos, P. and Trancoso, I. and Abad, A.},
    • title = {Speaker Verification Using Secure Binary Embeddings},
    • booktitle = {European Signal Processing Conference (EUSIPCO)},
    • year = 2013,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2013-082}
    • }
  •  Tachioka, Y., Watanabe, S., "Discriminative Training of Acoustic Models for System Combination", Interspeech, August 2013.
    BibTeX TR2013-074 PDF
    • @inproceedings{Tachioka2013aug,
    • author = {Tachioka, Y. and Watanabe, S.},
    • title = {Discriminative Training of Acoustic Models for System Combination},
    • booktitle = {Interspeech},
    • year = 2013,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2013-074}
    • }
  •  Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Discriminative Methods for Noise Robust Speech Recognition: A CHiME Challenge Benchmark", International Workshop on Machine Listening in Multisource Environments (CHiME), June 2013.
    BibTeX TR2013-044 PDF
    • @inproceedings{Tachioka2013jun,
    • author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
    • title = {Discriminative Methods for Noise Robust Speech Recognition: A CHiME Challenge Benchmark},
    • booktitle = {International Workshop on Machine Listening in Multisource Environments (CHiME)},
    • year = 2013,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2013-044}
    • }
  •  Fevotte, C., Le Roux, J., Hershey, J.R., "Non-negative Dynamical System with Application to Speech and Audio", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
    BibTeX TR2013-021 PDF Software
    • @inproceedings{Fevotte2013may,
    • author = {Fevotte, C. and {Le Roux}, J. and Hershey, J.R.},
    • title = {Non-negative Dynamical System with Application to Speech and Audio},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-021}
    • }
  •  Le Roux, J., Boufounos, P.T., Kang, K., Hershey, J.R., "Source Localization in Reverberant Environments using Sparse Optimization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6638473, May 2013, pp. 4310-4314.
    BibTeX TR2013-022 PDF
    • @inproceedings{LeRoux2013may,
    • author = {{Le Roux}, J. and Boufounos, P.T. and Kang, K. and Hershey, J.R.},
    • title = {Source Localization in Reverberant Environments using Sparse Optimization},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • pages = {4310--4314},
    • month = may,
    • doi = {10.1109/ICASSP.2013.6638473},
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2013-022}
    • }
  •  Tachioka, Y., Watanabe, S., Hershey, J.R., "Effectiveness of Discriminative Training and Feature Transformation for Reverberated and Noisy Speech", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
    BibTeX TR2013-020 PDF
    • @inproceedings{Tachioka2013may,
    • author = {Tachioka, Y. and Watanabe, S. and Hershey, J.R.},
    • title = {Effectiveness of Discriminative Training and Feature Transformation for Reverberated and Noisy Speech},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-020}
    • }
  •  Vincent, E., Barker, J., Watanabe, S., Le Roux, J., Nesta, F., Matassoni, M., "The Second 'CHiME' Speech Separation and Recognition Challenge: Datasets, Tasks and Baselines", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
    BibTeX TR2013-079 PDF
    • @inproceedings{Vincent2013may,
    • author = {Vincent, E. and Barker, J. and Watanabe, S. and {Le Roux}, J. and Nesta, F. and Matassoni, M.},
    • title = {The Second 'CHiME' Speech Separation and Recognition Challenge: Datasets, Tasks and Baselines},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-079}
    • }
  •  Watanabe, S., Hershey, J.R., "Stereo-based Feature Enhancement Using Dictionary Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6639034, May 2013, pp. 7073-7077.
    BibTeX TR2013-019 PDF
    • @inproceedings{Watanabe2013may,
    • author = {Watanabe, S. and Hershey, J.R.},
    • title = {Stereo-based Feature Enhancement Using Dictionary Learning},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2013,
    • pages = {7073--7077},
    • month = may,
    • doi = {10.1109/ICASSP.2013.6639034},
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2013-019}
    • }
  •  Potluru, V.K., Plis, S.M., Le Roux, J., Pearlmutter, B.A., Calhoun, V.D., Hayes, T.P., "Block Coordinate Descent for Sparse NMF", International Conference on Learning Representations (ICLR), May 2013.
    BibTeX TR2013-026 PDF
    • @inproceedings{Potluru2013may,
    • author = {Potluru, V.K. and Plis, S.M. and {Le Roux}, J. and Pearlmutter, B.A. and Calhoun, V.D. and Hayes, T.P.},
    • title = {Block Coordinate Descent for Sparse NMF},
    • booktitle = {International Conference on Learning Representations (ICLR)},
    • year = 2013,
    • month = may,
    • url = {https://www.merl.com/publications/TR2013-026}
    • }
  •  Le Roux, J., Vincent, E., "Consistent Wiener Filtering for Audio Source Separation", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2012.2225617, Vol. 20, No. 3, pp. 217-220, March 2013.
    BibTeX TR2012-090 PDF
    • @article{LeRoux2013mar,
    • author = {{Le Roux}, J. and Vincent, E.},
    • title = {Consistent Wiener Filtering for Audio Source Separation},
    • journal = {IEEE Signal Processing Letters},
    • year = 2013,
    • volume = 20,
    • number = 3,
    • pages = {217--220},
    • month = mar,
    • doi = {10.1109/LSP.2012.2225617},
    • url = {https://www.merl.com/publications/TR2012-090}
    • }
  •  Watanabe, S., Nakamura, A., "Bayesian Approaches to Acoustic Modeling: A Review", APSIPA Transactions on Signal and Information Processing, DOI: 10.1017/ATSIP.2012.6, Vol. 1, December 2012.
    BibTeX TR2012-087 PDF
    • @article{Watanabe2012dec,
    • author = {Watanabe, S. and Nakamura, A.},
    • title = {Bayesian Approaches to Acoustic Modeling: A Review},
    • journal = {APSIPA Transactions on Signal and Information Processing},
    • year = 2012,
    • volume = 1,
    • month = dec,
    • doi = {10.1017/ATSIP.2012.6},
    • url = {https://www.merl.com/publications/TR2012-087}
    • }
  •  Hershey, J.R., Rennie, S.J., Le Roux, J., "Factorial Models for Noise Robust Speech Recognition" in Techniques for Noise Robustness in Automatic Speech Recognition, Virtanen, T., Singh, R., Raj, B., Eds., chapter 12, Wiley, November 2012.
    BibTeX TR2012-002 PDF
    • @incollection{Hershey2012nov,
    • author = {Hershey, J.R. and Rennie, S.J. and {Le Roux}, J.},
    • title = {Factorial Models for Noise Robust Speech Recognition},
    • booktitle = {Techniques for Noise Robustness in Automatic Speech Recognition},
    • year = 2012,
    • editor = {Virtanen, T. and Singh, R. and Raj, B.},
    • chapter = 12,
    • month = nov,
    • publisher = {Wiley},
    • url = {https://www.merl.com/publications/TR2012-002}
    • }
  •  Gales, M., Watanabe, S., Fosler-Lussier, E., "Structured Discriminative Models For Speech Recognition", IEEE Signal Processing Magazine, Vol. 29, No. 6, pp. 70-81, November 2012.
    BibTeX TR2012-072 PDF
    • @article{Gales2012nov,
    • author = {Gales, M. and Watanabe, S. and Fosler-Lussier, E.},
    • title = {Structured Discriminative Models For Speech Recognition},
    • journal = {IEEE Signal Processing Magazine},
    • year = 2012,
    • volume = 29,
    • number = 6,
    • pages = {70--81},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2012-072}
    • }
  •  Zhang, J., Borowsky, A., Schmidt-Nielsen, B., Harsham, B., Weinberg, G., Romoser, M.R.E., Fisher, D.L., "Evaluation of Two Types of In-Vehicle Music Retrieval and Navigation Systems", Annual Meeting of the Human Factors and Ergonomics Society (HFES), October 2012.
    BibTeX TR2012-097 PDF
    • @inproceedings{Zhang2012oct,
    • author = {Zhang, J. and Borowsky, A. and Schmidt-Nielsen, B. and Harsham, B. and Weinberg, G. and Romoser, M.R.E. and Fisher, D.L.},
    • title = {Evaluation of Two Types of In-Vehicle Music Retrieval and Navigation Systems},
    • booktitle = {Annual Meeting of the Human Factors and Ergonomics Society (HFES)},
    • year = 2012,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2012-097}
    • }
  •  Heaukulani, C., Le Roux, J., Hershey, J.R., "Latent Dirichlet Reallocation for Term Swapping", International Workshop on Statistical Machine Learning for Speech Processing (IWSML), March 2012.
    BibTeX TR2012-022 PDF
    • @inproceedings{Heaukulani2012mar,
    • author = {Heaukulani, C. and {Le Roux}, J. and Hershey, J.R.},
    • title = {Latent Dirichlet Reallocation for Term Swapping},
    • booktitle = {International Workshop on Statistical Machine Learning for Speech Processing (IWSML)},
    • year = 2012,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2012-022}
    • }
  •  Le Roux, J., Hershey, J.R., "Indirect Model-based Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2012.6288806, March 2012, pp. 4045-4048.
    BibTeX TR2012-016 PDF
    • @inproceedings{LeRoux2012mar2,
    • author = {{Le Roux}, J. and Hershey, J.R.},
    • title = {Indirect Model-based Speech Enhancement},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2012,
    • pages = {4045--4048},
    • month = mar,
    • doi = {10.1109/ICASSP.2012.6288806},
    • issn = {1520-6149},
    • isbn = {978-1-4673-0045-2},
    • url = {https://www.merl.com/publications/TR2012-016}
    • }
  •  Le Roux, J., Hershey, J.R., "Speech Enhancement by Indirect VTS", Acoustical Society of Japan Spring Meeting (ASJ), March 2012.
    BibTeX TR2012-011 PDF
    • @inproceedings{LeRoux2012mar1,
    • author = {{Le Roux}, J. and Hershey, J.R.},
    • title = {Speech Enhancement by Indirect VTS},
    • booktitle = {Acoustical Society of Japan Spring Meeting (ASJ)},
    • year = 2012,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2012-011}
    • }
  •  Weinberg, G., Harsham, B., Medenica, Z., "Investigating HUDs for the Presentation of Choice Lists in Car Navigation Systems", International Driving Symposium on Human Factors in Driver Assessment, Training and Vehicle Design, June 2011.
    BibTeX TR2011-060 PDF
    • @inproceedings{Weinberg2011jun,
    • author = {Weinberg, G. and Harsham, B. and Medenica, Z.},
    • title = {Investigating HUDs for the Presentation of Choice Lists in Car Navigation Systems},
    • booktitle = {International Driving Symposium on Human Factors in Driver Assessment, Training and Vehicle Design},
    • year = 2011,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2011-060}
    • }
  •  Mueller, C., Weinberg, G., "Multimodal Input in the Car, Today and Tomorrow", IEEE Multimedia, Vol. 18, No. 1, pp. 98-103, January 2011.
    BibTeX TR2011-002 PDF
    • @article{Mueller2011jan,
    • author = {Mueller, C. and Weinberg, G.},
    • title = {Multimodal Input in the Car, Today and Tomorrow},
    • journal = {IEEE Multimedia},
    • year = 2011,
    • volume = 18,
    • number = 1,
    • pages = {98--103},
    • month = jan,
    • issn = {1070-986X},
    • url = {https://www.merl.com/publications/TR2011-002}
    • }
  •  Gouvea, E., Ezzat, T., "Vocabulary Independent Spoken Query: a Case for Subword Units", Interspeech, September 2010.
    BibTeX TR2010-089 PDF
    • @inproceedings{Gouvea2010sep,
    • author = {Gouvea, E. and Ezzat, T.},
    • title = {Vocabulary Independent Spoken Query: a Case for Subword Units},
    • booktitle = {Interspeech},
    • year = 2010,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2010-089}
    • }
  •  Raj, B., Wilson, K.W., Krueger, A., Haeb-Umbach, R., "Ungrounded Independent Non-Negative Factor Analysis", Interspeech, September 2010, pp. 330-333.
    BibTeX TR2010-122 PDF
    • @inproceedings{Raj2010sep,
    • author = {Raj, B. and Wilson, K.W. and Krueger, A. and Haeb-Umbach, R.},
    • title = {Ungrounded Independent Non-Negative Factor Analysis},
    • booktitle = {Interspeech},
    • year = 2010,
    • pages = {330--333},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2010-122}
    • }
  •  Weinberg, G., Harsham, B., Forlines, C., Medenica, Z., "Contextual Push-to-talk: Shortening Voice Dialogs to Improve Driving Performance", International Conference on Human-Computer Interaction with Mobile Devices and Services (MobileHCI), September 2010, pp. 113-122.
    BibTeX TR2010-085 PDF
    • @inproceedings{Weinberg2010sep1,
    • author = {Weinberg, G. and Harsham, B. and Forlines, C. and Medenica, Z.},
    • title = {Contextual Push-to-talk: Shortening Voice Dialogs to Improve Driving Performance},
    • booktitle = {International Conference on Human-Computer Interaction with Mobile Devices and Services (MobileHCI)},
    • year = 2010,
    • pages = {113--122},
    • month = sep,
    • isbn = {978-1-60558-835-3},
    • url = {https://www.merl.com/publications/TR2010-085}
    • }
  •  Weinberg, G., Harsham, B., "Object-Oriented Multimodality for Safer In-Vehicle Interfaces", Speech in Mobile and Pervasive Environments (SiMPE), September 2010.
    BibTeX TR2010-084 PDF
    • @inproceedings{Weinberg2010sep2,
    • author = {Weinberg, G. and Harsham, B.},
    • title = {Object-Oriented Multimodality for Safer In-Vehicle Interfaces},
    • booktitle = {Speech in Mobile and Pervasive Environments (SiMPE)},
    • year = 2010,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2010-084}
    • }
  •  Garay-Vega, L., Pradhan, A.K., Weinberg, G.L., Schmidt-Nielsen, B.K., Harsham, B.A., Shen, Y., Divekar, G., Romoser, M., Knodler, M., Fisher, D.L., "Evaluation of Different Speech and Touch Interfaces to In-vehicle Music Retrieval Systems", Accident Analysis & Prevention, Vol. 42, No. 3, May 2010.
    BibTeX TR2010-025 PDF
    • @article{Garay-Vega2010may,
    • author = {Garay-Vega, L. and Pradhan, A.K. and Weinberg, G.L. and Schmidt-Nielsen, B.K. and Harsham, B.A. and Shen, Y. and Divekar, G. and Romoser, M. and Knodler, M. and Fisher, D.L.},
    • title = {Evaluation of Different Speech and Touch Interfaces to In-vehicle Music Retrieval Systems},
    • journal = {Accident Analysis \& Prevention},
    • year = 2010,
    • volume = 42,
    • number = 3,
    • month = may,
    • issn = {0001-4575},
    • url = {https://www.merl.com/publications/TR2010-025}
    • }