Publications

378 / 3,813 publications found.


  •  Brand, M., "Nonrigid Embeddings for Dimensionality Reduction", European Conference on Machine Learning (ECML), October 2005, vol. 3720.
    BibTeX TR2005-117 PDF
    • @inproceedings{Brand2005oct,
    •   author    = {Brand, M.},
    •   title     = {{Nonrigid Embeddings for Dimensionality Reduction}},
    •   booktitle = {European Conference on Machine Learning (ECML)},
    •   volume    = {3720},
    •   month     = oct,
    •   year      = {2005},
    •   isbn      = {3-540-29243-8},
    •   url       = {https://www.merl.com/publications/TR2005-117}
    • }
  •  Bansal, D., Raj, B., Smaragdis, P., "Bandwidth Expansion of Narrowband Speech Using non-Negative Matrix Factorization", Eurospeech, September 2005.
    BibTeX TR2005-135 PDF
    • @inproceedings{Bansal2005sep,
    •   author    = {Bansal, D. and Raj, B. and Smaragdis, P.},
    •   title     = {{Bandwidth Expansion of Narrowband Speech Using non-Negative Matrix Factorization}},
    •   booktitle = {Eurospeech},
    •   month     = sep,
    •   year      = {2005},
    •   url       = {https://www.merl.com/publications/TR2005-135}
    • }
  •  Raj, B., Singh, R., Smaragdis, P., "Recognizing Speech from Simultaneous Speakers", Eurospeech, September 2005.
    BibTeX TR2005-136 PDF
    • @inproceedings{Raj2005sep,
    •   author    = {Raj, B. and Singh, R. and Smaragdis, P.},
    •   title     = {{Recognizing Speech from Simultaneous Speakers}},
    •   booktitle = {Eurospeech},
    •   month     = sep,
    •   year      = {2005},
    •   url       = {https://www.merl.com/publications/TR2005-136}
    • }
  •  Vlasic, D., Brand, M., Pfister, H., Popovic, J., "Face Transfer with Multilinear Models", ACM Transactions on Graphics (TOG), Vol. 24, No. 3, pp. 426-433, July 2005.
    BibTeX TR2005-048 PDF
    • @article{Vlasic2005jul,
    • author = {Vlasic, D. and Brand, M. and Pfister, H. and Popovic, J.},
    • title = {{Face Transfer with Multilinear Models}},
    • journal = {ACM Transactions on Graphics (TOG)},
    • year = 2005,
    • volume = 24,
    • number = 3,
    • pages = {426--433},
    • month = jul,
    • issn = {0730-0301},
    • url = {https://www.merl.com/publications/TR2005-048}
    • }
  •  Rich, C., Sidner, C., Lesh, N., Garland, A., Booth, S., Chimani, M., "DiamondHelp: A Collaborative Interface Framework for Networked Home Appliances", IEEE International Conference on Distributed Computing Systems Workshops, June 2005, pp. 514-519.
    BibTeX TR2004-114 PDF
    • @inproceedings{Rich2005jun,
    •   author    = {Rich, C. and Sidner, C. and Lesh, N. and Garland, A. and Booth, S. and Chimani, M.},
    •   title     = {{DiamondHelp: A Collaborative Interface Framework for Networked Home Appliances}},
    •   booktitle = {IEEE International Conference on Distributed Computing Systems Workshops},
    •   pages     = {514--519},
    •   month     = jun,
    •   year      = {2005},
    •   url       = {https://www.merl.com/publications/TR2004-114}
    • }
  •  Hancock, M.S., Shen, C., Forlines, C., Ryall, K., "Exploring Non-Speech Auditory Feedback at an Interactive Multi-User Tabletop", Conference on Graphics Interface (GI), May 2005, pp. 41-50.
    BibTeX TR2005-054 PDF
    • @inproceedings{Hancock2005may,
    • author = {Hancock, M. S. and Shen, C. and Forlines, C. and Ryall, K.},
    • title = {{Exploring Non-Speech Auditory Feedback at an Interactive Multi-User Tabletop}},
    • booktitle = {Conference on Graphics Interface (GI)},
    • year = 2005,
    • pages = {41--50},
    • month = may,
    • issn = {0713-5424},
    • url = {https://www.merl.com/publications/TR2005-054}
    • }
  •  Guinness, J., Raj, B., Schmidt-Nielsen, B., Turicchia, L., Sarpeshkar, R., "A Companding Front End for Noise-Robust Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 1, pp. 249-252.
    BibTeX TR2005-023 PDF
    • @inproceedings{Guinness2005mar,
    •   author    = {Guinness, J. and Raj, B. and Schmidt-Nielsen, B. and Turicchia, L. and Sarpeshkar, R.},
    •   title     = {{A Companding Front End for Noise-Robust Automatic Speech Recognition}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   volume    = {1},
    •   pages     = {249--252},
    •   month     = mar,
    •   year      = {2005},
    •   issn      = {1520-6149},
    •   url       = {https://www.merl.com/publications/TR2005-023}
    • }
  •  Nie, Y., Kong, H.-S., Vetro, A., Barner, K., "Fast Adaptive Fuzzy Post-Filtering for Coding Artifacts Removal in Interlaced Video", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 993-996.
    BibTeX TR2005-018 PDF
    • @inproceedings{Nie2005mar,
    •   author    = {Nie, Y. and Kong, H.-S. and Vetro, A. and Barner, K.},
    •   title     = {{Fast Adaptive Fuzzy Post-Filtering for Coding Artifacts Removal in Interlaced Video}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   volume    = {2},
    •   pages     = {993--996},
    •   month     = mar,
    •   year      = {2005},
    •   issn      = {1520-6149},
    •   url       = {https://www.merl.com/publications/TR2005-018}
    • }
  •  Wang, B., Wang, Y., Selesnick, I., Vetro, A., "Video Coding Using 3-D Dual-Tree Discrete Wavelet Transforms", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 61-64.
    BibTeX TR2005-019 PDF
    • @inproceedings{Wang2005mar,
    •   author    = {Wang, B. and Wang, Y. and Selesnick, I. and Vetro, A.},
    •   title     = {{Video Coding Using 3-D Dual-Tree Discrete Wavelet Transforms}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   volume    = {2},
    •   pages     = {61--64},
    •   month     = mar,
    •   year      = {2005},
    •   issn      = {1520-6149},
    •   url       = {https://www.merl.com/publications/TR2005-019}
    • }
  •  Xie, L., Kennedy, L., Chang, S.-F., Divakaran, A., Sun, H., Lin, C.-Y., "Layered Dynamic Mixture Model for Pattern Discovery in Asynchronous Multi-Modal Streams", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 1053-1056.
    BibTeX TR2005-078 PDF
    • @inproceedings{Xie2005mar,
    •   author    = {Xie, L. and Kennedy, L. and Chang, S.-F. and Divakaran, A. and Sun, H. and Lin, C.-Y.},
    •   title     = {{Layered Dynamic Mixture Model for Pattern Discovery in Asynchronous Multi-Modal Streams}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   volume    = {2},
    •   pages     = {1053--1056},
    •   month     = mar,
    •   year      = {2005},
    •   issn      = {1520-6149},
    •   url       = {https://www.merl.com/publications/TR2005-078}
    • }
  •  Radhakrishnan, R., Divakaran, A., "Systematic Acquisition of Audio Classes for Elevator Surveillance", SPIE Conference on Image and Video Communications and Processing, March 2005, vol. 5685, pp. 64-71.
    BibTeX TR2005-076 PDF
    • @inproceedings{Radhakrishnan2005mar,
    •   author    = {Radhakrishnan, R. and Divakaran, A.},
    •   title     = {{Systematic Acquisition of Audio Classes for Elevator Surveillance}},
    •   booktitle = {SPIE Conference on Image and Video Communications and Processing},
    •   volume    = {5685},
    •   pages     = {64--71},
    •   month     = mar,
    •   year      = {2005},
    •   url       = {https://www.merl.com/publications/TR2005-076}
    • }
  •  Radhakrishnan, R., Otsuka, I., Xiong, Z., Divakaran, A., "Modelling Sports Highlights Using a Time Series Clustering Framework and Model Interpretation", SPIE Conference on Storage and Retrieval Methods and Applications for Multimedia, January 2005, vol. 5682, pp. 269-276.
    BibTeX TR2005-077 PDF
    • @inproceedings{Radhakrishnan2005jan,
    •   author    = {Radhakrishnan, R. and Otsuka, I. and Xiong, Z. and Divakaran, A.},
    •   title     = {{Modelling Sports Highlights Using a Time Series Clustering Framework and Model Interpretation}},
    •   booktitle = {SPIE Conference on Storage and Retrieval Methods and Applications for Multimedia},
    •   volume    = {5682},
    •   pages     = {269--276},
    •   month     = jan,
    •   year      = {2005},
    •   url       = {https://www.merl.com/publications/TR2005-077}
    • }
  •  Divakaran, A., Otsuka, I., Radhakrishnan, R., Nakane, K., Ogawa, M., "Audio-Assisted Video Browsing for DVD Recorders", IEEE Pacific-Rim Conference on Multimedia (PCM), November 2004.
    BibTeX TR2004-139 PDF
    • @inproceedings{Divakaran2004nov,
    •   author    = {Divakaran, A. and Otsuka, I. and Radhakrishnan, R. and Nakane, K. and Ogawa, M.},
    •   title     = {{Audio-Assisted Video Browsing for DVD Recorders}},
    •   booktitle = {IEEE Pacific-Rim Conference on Multimedia (PCM)},
    •   month     = nov,
    •   year      = {2004},
    •   url       = {https://www.merl.com/publications/TR2004-139}
    • }
  •  Xie, L., Kennedy, L., Chang, S.-F., Divakaran, A., Sun, H., Lin, C.-Y., "Discovering Meaningful Multimedia Patterns with Audio-Visual Concepts and Associated Text", IEEE International Conference on Image Processing (ICIP), October 2004, vol. 4, pp. 2383-2386.
    BibTeX TR2004-128 PDF
    • @inproceedings{Xie2004oct,
    •   author    = {Xie, L. and Kennedy, L. and Chang, S.-F. and Divakaran, A. and Sun, H. and Lin, C.-Y.},
    •   title     = {{Discovering Meaningful Multimedia Patterns with Audio-Visual Concepts and Associated Text}},
    •   booktitle = {IEEE International Conference on Image Processing (ICIP)},
    •   volume    = {4},
    •   pages     = {2383--2386},
    •   month     = oct,
    •   year      = {2004},
    •   issn      = {1522-4880},
    •   url       = {https://www.merl.com/publications/TR2004-128}
    • }
  •  Wolf, P., Woelfel, J., van Gemert, J., Raj, B., Wong, D., "SpokenQuery: An Alternate Approach to Choosing Items with Speech", International Conference on Spoken Language Processing (ICSLP), October 2004.
    BibTeX TR2004-121 PDF
    • @inproceedings{Wolf2004oct,
    •   author    = {Wolf, P. and Woelfel, J. and {van Gemert}, J. and Raj, B. and Wong, D.},
    •   title     = {{SpokenQuery: An Alternate Approach to Choosing Items with Speech}},
    •   booktitle = {International Conference on Spoken Language Processing (ICSLP)},
    •   month     = oct,
    •   year      = {2004},
    •   url       = {https://www.merl.com/publications/TR2004-121}
    • }
  •  Seltzer, M.L., Raj, B., Stern, R.M., "Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition", IEEE Transactions on Speech and Audio Processing, Vol. 12, No. 5, pp. 489-498, September 2004.
    BibTeX TR2004-088 PDF
    • @article{Seltzer2004sep1,
    • author = {Seltzer, M. L. and Raj, B. and Stern, R. M.},
    • title = {{Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition}},
    • journal = {IEEE Transactions on Speech and Audio Processing},
    • year = 2004,
    • volume = 12,
    • number = 5,
    • pages = {489--498},
    • month = sep,
    • note = {Awarded Best Young Author, March 2007},
    • issn = {1063-6676},
    • url = {https://www.merl.com/publications/TR2004-088}
    • }
  •  Seltzer, M.L., Raj, B., Stern, R.M., "A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 379-393, September 2004.
    BibTeX TR2004-086 PDF
    • @article{Seltzer2004sep2,
    • author = {Seltzer, M. L. and Raj, B. and Stern, R. M.},
    • title = {{A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition}},
    • journal = {Speech Communication},
    • year = 2004,
    • volume = 43,
    • number = 4,
    • pages = {379--393},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2004-086}
    • }
  •  Raj, B., Seltzer, M.L., Stern, R.M., "Reconstruction of Missing Features for Robust Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 275-296, September 2004.
    BibTeX TR2004-087 PDF
    • @article{Raj2004sep,
    • author = {Raj, B. and Seltzer, M. L. and Stern, R. M.},
    • title = {{Reconstruction of Missing Features for Robust Speech Recognition}},
    • journal = {Speech Communication},
    • year = 2004,
    • volume = 43,
    • number = 4,
    • pages = {275--296},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2004-087}
    • }
  •  Singh, R., Raj, B., "Classification in Likelihood Spaces", Technometrics, Vol. 46, No. 3, pp. 318-329, August 2004.
    BibTeX TR2004-089 PDF
    • @article{Singh2004aug,
    • author = {Singh, R. and Raj, B.},
    • title = {{Classification in Likelihood Spaces}},
    • journal = {Technometrics},
    • year = 2004,
    • volume = 46,
    • number = 3,
    • pages = {318--329},
    • month = aug,
    • issn = {0040-1706},
    • url = {https://www.merl.com/publications/TR2004-089}
    • }
  •  Smaragdis, P., "Exploiting Redundancy to Construct Listening Systems", Perspectives on Speech Separation, July 2004.
    BibTeX SpringerLink
    • @inproceedings{Smaragdis2004jul,
    •   author    = {Smaragdis, P.},
    •   title     = {{Exploiting Redundancy to Construct Listening Systems}},
    •   booktitle = {Perspectives on Speech Separation},
    •   month     = jul,
    •   year      = {2004},
    •   url       = {https://link.springer.com/chapter/10.1007/0-387-22794-6_7}
    • }
  •  Raj, B., Singh, R., Stern, R.M., "On Tracking Noise with Linear Dynamical System Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2004, vol. 1, pp. 965-968.
    BibTeX TR2004-042 PDF
    • @inproceedings{Raj2004may,
    • author = {Raj, B. and Singh, R. and Stern, R. M.},
    • title = {{On Tracking Noise with Linear Dynamical System Models}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2004,
    • volume = 1,
    • pages = {965--968},
    • month = may,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2004-042}
    • }
  •  Divi, V., Forlines, C., van Gemert, J.V., Raj, B., Schmidt-Nielsen, B., Wittenburg, K., Woelfel, J., Wolf, P., Zhang, F., "A Speech-In List-Out Approach to Spoken User Interfaces", Human Language Technology Conference (HLT), May 2004.
    BibTeX TR2004-023 PDF
    • @inproceedings{Divi2004may,
    • author = {Divi, V. and Forlines, C. and {van Gemert}, J. V. and Raj, B. and Schmidt-Nielsen, B. and Wittenburg, K. and Woelfel, J. and Wolf, P. and Zhang, F.},
    • title = {{A Speech-In List-Out Approach to Spoken User Interfaces}},
    • booktitle = {Human Language Technology Conference (HLT)},
    • year = 2004,
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-023}
    • }
  •  Raj, B., Seltzer, M.L., Reyes-Gomez, M.J., "Speech Recognizer Based Maximum Likelihood Beamforming", NSF Workshop on Perspectives on Speech Separation, October 2003.
    BibTeX TR2003-87 PDF
    • @inproceedings{Raj2003oct,
    • author = {Raj, B. and Seltzer, M. L. and Reyes-Gomez, M. J.},
    • title = {{Speech Recognizer Based Maximum Likelihood Beamforming}},
    • booktitle = {NSF Workshop on Perspectives on Speech Separation},
    • year = 2003,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-87}
    • }
  •  Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 13-16.
    BibTeX TR2003-88 PDF
    • @inproceedings{Reyes-Gomez2003oct,
    • author = {Reyes-Gomez, M. J. and Raj, B. and Ellis, D. P. W.},
    • title = {{Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2003,
    • pages = {13--16},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-88}
    • }
  •  Peker, K.A., Divakaran, A., "An Extended Framework for Adaptive Playback-Based Video Summarization", SPIE Conference on Internet Multimedia Management Systems, September 2003, vol. 5242, pp. 26-33.
    BibTeX TR2003-115 PDF
    • @inproceedings{Peker2003sep,
    • author = {Peker, K. A. and Divakaran, A.},
    • title = {{An Extended Framework for Adaptive Playback-Based Video Summarization}},
    • booktitle = {SPIE Conference on Internet Multimedia Management Systems},
    • year = 2003,
    • volume = 5242,
    • pages = {26--33},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2003-115}
    • }