- Brand, M., "Nonrigid Embeddings for Dimensionality Reduction", European Conference on Machine Learning (ECML), October 2005, vol. 3720.
BibTeX TR2005-117 PDF- @inproceedings{Brand2005oct,
- author = {Brand, M.},
- title = {{Nonrigid Embeddings for Dimensionality Reduction}},
- booktitle = {European Conference on Machine Learning (ECML)},
- year = 2005,
- volume = 3720,
- month = oct,
- isbn = {3-540-29243-8},
- url = {https://www.merl.com/publications/TR2005-117}
- }
- Bansal, D., Raj, B., Smaragdis, P., "Bandwidth Expansion of Narrowband Speech Using non-Negative Matrix Factorization", Eurospeech, September 2005.
BibTeX TR2005-135 PDF- @inproceedings{Bansal2005sep,
- author = {Bansal, D. and Raj, B. and Smaragdis, P.},
- title = {{Bandwidth Expansion of Narrowband Speech Using non-Negative Matrix Factorization}},
- booktitle = {Eurospeech},
- year = 2005,
- month = sep,
- url = {https://www.merl.com/publications/TR2005-135}
- }
- Raj, B., Singh, R., Smaragdis, P., "Recognizing Speech from Simultaneous Speakers", Eurospeech, September 2005.
BibTeX TR2005-136 PDF- @inproceedings{Raj2005sep,
- author = {Raj, B. and Singh, R. and Smaragdis, P.},
- title = {{Recognizing Speech from Simultaneous Speakers}},
- booktitle = {Eurospeech},
- year = 2005,
- month = sep,
- url = {https://www.merl.com/publications/TR2005-136}
- }
- Vlasic, D., Brand, M., Pfister, H., Popovic, J., "Face Transfer with Multilinear Models", ACM Transactions on Graphics (TOG), Vol. 24, No. 3, pp. 426-433, July 2005.
BibTeX TR2005-048 PDF- @article{Vlasic2005jul,
- author = {Vlasic, D. and Brand, M. and Pfister, H. and Popovic, J.},
- title = {{Face Transfer with Multilinear Models}},
- journal = {ACM Transactions on Graphics (TOG)},
- year = 2005,
- volume = 24,
- number = 3,
- pages = {426--433},
- month = jul,
- issn = {0730-0301},
- url = {https://www.merl.com/publications/TR2005-048}
- }
- Rich, C., Sidner, C., Lesh, N., Garland, A., Booth, S., Chimani, M., "DiamondHelp: A Collaborative Interface Framework for Networked Home Appliances", IEEE International Conference on Distributed Computing Systems Workshops, June 2005, pp. 514-519.
BibTeX TR2004-114 PDF- @inproceedings{Rich2005jun,
- author = {Rich, C. and Sidner, C. and Lesh, N. and Garland, A. and Booth, S. and Chimani, M.},
- title = {{DiamondHelp: A Collaborative Interface Framework for Networked Home Appliances}},
- booktitle = {IEEE International Conference on Distributed Computing Systems Workshops},
- year = 2005,
- pages = {514--519},
- month = jun,
- url = {https://www.merl.com/publications/TR2004-114}
- }
- Hancock, M.S., Shen, C., Forlines, C., Ryall, K., "Exploring Non-Speech Auditory Feedback at an Interactive Multi-User Tabletop", Conference on Graphics Interface (GI), May 2005, pp. 41-50.
BibTeX TR2005-054 PDF- @inproceedings{Hancock2005may,
- author = {Hancock, M.S. and Shen, C. and Forlines, C. and Ryall, K.},
- title = {{Exploring Non-Speech Auditory Feedback at an Interactive Multi-User Tabletop}},
- booktitle = {Conference on Graphics Interface (GI)},
- year = 2005,
- pages = {41--50},
- month = may,
- issn = {0713-5424},
- url = {https://www.merl.com/publications/TR2005-054}
- }
- Guinness, J., Raj, B., Schmidt-Nielsen, B., Turicchia, L., Sarpeshkar, R., "A Companding Front End for Noise-Robust Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 1, pp. 249-252.
BibTeX TR2005-023 PDF- @inproceedings{Guinness2005mar,
- author = {Guinness, J. and Raj, B. and Schmidt-Nielsen, B. and Turicchia, L. and Sarpeshkar, R.},
- title = {{A Companding Front End for Noise-Robust Automatic Speech Recognition}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2005,
- volume = 1,
- pages = {249--252},
- month = mar,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2005-023}
- }
- Nie, Y., Kong, H.-S., Vetro, A., Barner, K., "Fast Adaptive Fuzzy Post-Filtering for Coding Artifacts Removal in Interlaced Video", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 993-996.
BibTeX TR2005-018 PDF- @inproceedings{Nie2005mar,
- author = {Nie, Y. and Kong, H.-S. and Vetro, A. and Barner, K.},
- title = {{Fast Adaptive Fuzzy Post-Filtering for Coding Artifacts Removal in Interlaced Video}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2005,
- volume = 2,
- pages = {993--996},
- month = mar,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2005-018}
- }
- Wang, B., Wang, Y., Selesnick, I., Vetro, A., "Video Coding Using 3-D Dual-Tree Discrete Wavelet Transforms", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 61-64.
BibTeX TR2005-019 PDF- @inproceedings{Wang2005mar,
- author = {Wang, B. and Wang, Y. and Selesnick, I. and Vetro, A.},
- title = {{Video Coding Using 3-D Dual-Tree Discrete Wavelet Transforms}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2005,
- volume = 2,
- pages = {61--64},
- month = mar,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2005-019}
- }
- Xie, L., Kennedy, L., Chang, S.-F., Divakaran, A., Sun, H., Lin, C.-Y., "Layered Dynamic Mixture Model for Pattern Discovery in Asynchronous Multi-Modal Streams", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 1053-1056.
BibTeX TR2005-078 PDF- @inproceedings{Xie2005mar,
- author = {Xie, L. and Kennedy, L. and Chang, S.-F. and Divakaran, A. and Sun, H. and Lin, C.-Y.},
- title = {{Layered Dynamic Mixture Model for Pattern Discovery in Asynchronous Multi-Modal Streams}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2005,
- volume = 2,
- pages = {1053--1056},
- month = mar,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2005-078}
- }
- Radhakrishnan, R., Divakaran, A., "Systematic Acquisition of Audio Classes for Elevator Surveillance", SPIE Conference on Image and Video Communications and Processing, March 2005, vol. 5685, pp. 64-71.
BibTeX TR2005-076 PDF- @inproceedings{Radhakrishnan2005mar,
- author = {Radhakrishnan, R. and Divakaran, A.},
- title = {{Systematic Acquisition of Audio Classes for Elevator Surveillance}},
- booktitle = {SPIE Conference on Image and Video Communications and Processing},
- year = 2005,
- volume = 5685,
- pages = {64--71},
- month = mar,
- url = {https://www.merl.com/publications/TR2005-076}
- }
- Radhakrishnan, R., Otsuka, I., Xiong, Z., Divakaran, A., "Modelling Sports Highlights Using a Time Series Clustering Framework and Model Interpretation", SPIE Conference on Storage and Retrieval Methods and Applications for Multimedia, January 2005, vol. 5682, pp. 269-276.
BibTeX TR2005-077 PDF- @inproceedings{Radhakrishnan2005jan,
- author = {Radhakrishnan, R. and Otsuka, I. and Xiong, Z. and Divakaran, A.},
- title = {{Modelling Sports Highlights Using a Time Series Clustering Framework and Model Interpretation}},
- booktitle = {SPIE Conference on Storage and Retrieval Methods and Applications for Multimedia},
- year = 2005,
- volume = 5682,
- pages = {269--276},
- month = jan,
- url = {https://www.merl.com/publications/TR2005-077}
- }
- Divakaran, A., Otsuka, I., Radhakrishnan, R., Nakane, K., Ogawa, M., "Audio-Assisted Video Browsing for DVD Recorders", IEEE Pacific-Rim Conference on Multimedia (PCM), November 2004.
BibTeX TR2004-139 PDF- @inproceedings{Divakaran2004nov,
- author = {Divakaran, A. and Otsuka, I. and Radhakrishnan, R. and Nakane, K. and Ogawa, M.},
- title = {{Audio-Assisted Video Browsing for DVD Recorders}},
- booktitle = {IEEE Pacific-Rim Conference on Multimedia (PCM)},
- year = 2004,
- month = nov,
- url = {https://www.merl.com/publications/TR2004-139}
- }
- Xie, L., Kennedy, L., Chang, S.-F., Divakaran, A., Sun, H., Lin, C.-Y., "Discovering Meaningful Multimedia Patterns with Audio-Visual Concepts and Associated Text", IEEE International Conference on Image Processing (ICIP), October 2004, vol. 4, pp. 2383-2386.
BibTeX TR2004-128 PDF- @inproceedings{Xie2004oct,
- author = {Xie, L. and Kennedy, L. and Chang, S.-F. and Divakaran, A. and Sun, H. and Lin, C.-Y.},
- title = {{Discovering Meaningful Multimedia Patterns with Audio-Visual Concepts and Associated Text}},
- booktitle = {IEEE International Conference on Image Processing (ICIP)},
- year = 2004,
- volume = 4,
- pages = {2383--2386},
- month = oct,
- issn = {1522-4880},
- url = {https://www.merl.com/publications/TR2004-128}
- }
- Wolf, P., Woelfel, J., van Gemert, J., Raj, B., Wong, D., "SpokenQuery: An Alternate Approach to Choosing Items with Speech", International Conference on Spoken Language Processing (ICSLP), October 2004.
BibTeX TR2004-121 PDF- @inproceedings{Wolf2004oct,
- author = {Wolf, P. and Woelfel, J. and {van Gemert}, J. and Raj, B. and Wong, D.},
- title = {{SpokenQuery: An Alternate Approach to Choosing Items with Speech}},
- booktitle = {International Conference on Spoken Language Processing (ICSLP)},
- year = 2004,
- month = oct,
- url = {https://www.merl.com/publications/TR2004-121}
- }
- Seltzer, M.L., Raj, B., Stern, R.M., "Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition", IEEE Transactions on Speech and Audio Processing, Vol. 12, No. 5, pp. 489-498, September 2004.
BibTeX TR2004-088 PDF- @article{Seltzer2004sep1,
- author = {Seltzer, M.L. and Raj, B. and Stern, R.M.},
- title = {{Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition}},
- journal = {IEEE Transactions on Speech and Audio Processing},
- year = 2004,
- volume = 12,
- number = 5,
- pages = {489--498},
- month = sep,
- note = {Awarded Best Young Author, March 2007},
- issn = {1063-6676},
- url = {https://www.merl.com/publications/TR2004-088}
- }
- Seltzer, M.L., Raj, B., Stern, R.M., "A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 379-393, September 2004.
BibTeX TR2004-086 PDF- @article{Seltzer2004sep2,
- author = {Seltzer, M.L. and Raj, B. and Stern, R.M.},
- title = {{A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition}},
- journal = {Speech Communication},
- year = 2004,
- volume = 43,
- number = 4,
- pages = {379--393},
- month = sep,
- url = {https://www.merl.com/publications/TR2004-086}
- }
- Raj, B., Seltzer, M.L., Stern, R.M., "Reconstruction of Missing Features for Robust Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 275-296, September 2004.
BibTeX TR2004-087 PDF- @article{Raj2004sep,
- author = {Raj, B. and Seltzer, M.L. and Stern, R.M.},
- title = {{Reconstruction of Missing Features for Robust Speech Recognition}},
- journal = {Speech Communication},
- year = 2004,
- volume = 43,
- number = 4,
- pages = {275--296},
- month = sep,
- url = {https://www.merl.com/publications/TR2004-087}
- }
- Singh, R., Raj, B., "Classification in Likelihood Spaces", Technometrics, Vol. 46, No. 3, pp. 318-329, August 2004.
BibTeX TR2004-089 PDF- @article{Singh2004aug,
- author = {Singh, R. and Raj, B.},
- title = {{Classification in Likelihood Spaces}},
- journal = {Technometrics},
- year = 2004,
- volume = 46,
- number = 3,
- pages = {318--329},
- month = aug,
- issn = {0040-1706},
- url = {https://www.merl.com/publications/TR2004-089}
- }
- Smaragdis, P., "Exploiting Redundancy to Construct Listening Systems", Perspectives on Speech Separation, July 2004.
BibTeX SpringerLink- @inproceedings{Smaragdis2004jul,
- author = {Smaragdis, P.},
- title = {{Exploiting Redundancy to Construct Listening Systems}},
- booktitle = {Perspectives on Speech Separation},
- year = 2004,
- month = jul,
- url = {https://link.springer.com/chapter/10.1007/0-387-22794-6_7}
- }
- Raj, B., Singh, R., Stern, R.M., "On Tracking Noise with Linear Dynamical System Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2004, vol. 1, pp. 965-968.
BibTeX TR2004-042 PDF- @inproceedings{Raj2004may,
- author = {Raj, B. and Singh, R. and Stern, R.M.},
- title = {{On Tracking Noise with Linear Dynamical System Models}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2004,
- volume = 1,
- pages = {965--968},
- month = may,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2004-042}
- }
- Divi, V., Forlines, C., van Gemert, J.V., Raj, B., Schmidt-Nielsen, B., Wittenburg, K., Woelfel, J., Wolf, P., Zhang, F., "A Speech-In List-Out Approach to Spoken User Interfaces", Human Language Technology Conference (HLT), May 2004.
BibTeX TR2004-023 PDF- @inproceedings{Divi2004may,
- author = {Divi, V. and Forlines, C. and {van Gemert}, J.V. and Raj, B. and Schmidt-Nielsen, B. and Wittenburg, K. and Woelfel, J. and Wolf, P. and Zhang, F.},
- title = {{A Speech-In List-Out Approach to Spoken User Interfaces}},
- booktitle = {Human Language Technology Conference (HLT)},
- year = 2004,
- month = may,
- url = {https://www.merl.com/publications/TR2004-023}
- }
- Raj, B., Seltzer, M.L., Reyes-Gomez, M.J., "Speech Recognizer Based Maximum Likelihood Beamforming", NSF Workshop on Perspectives on Speech Separation, October 2003.
BibTeX TR2003-87 PDF- @inproceedings{Raj2003oct,
- author = {Raj, B. and Seltzer, M.L. and Reyes-Gomez, M.J.},
- title = {{Speech Recognizer Based Maximum Likelihood Beamforming}},
- booktitle = {NSF Workshop on Perspectives on Speech Separation},
- year = 2003,
- month = oct,
- url = {https://www.merl.com/publications/TR2003-87}
- }
- Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 13-16.
BibTeX TR2003-88 PDF- @inproceedings{Reyes-Gomez2003oct,
- author = {Reyes-Gomez, M.J. and Raj, B. and Ellis, D.P.W.},
- title = {{Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2003,
- pages = {13--16},
- month = oct,
- url = {https://www.merl.com/publications/TR2003-88}
- }
- Peker, K.A., Divakaran, A., "An Extended Framework for Adaptive Playback-Based Video Summarization", SPIE Conference on Internet Multimedia Management Systems, September 2003, vol. 5242, pp. 26-33.
BibTeX TR2003-115 PDF- @inproceedings{Peker2003sep,
- author = {Peker, K.A. and Divakaran, A.},
- title = {{An Extended Framework for Adaptive Playback-Based Video Summarization}},
- booktitle = {SPIE Conference on Internet Multimedia Management Systems},
- year = 2003,
- volume = 5242,
- pages = {26--33},
- month = sep,
- url = {https://www.merl.com/publications/TR2003-115}
- }