Publications

Reddy, A.M., Raj, B., "Soft Mask Methods for Single-Channel Speaker Separation", IEEE Transactions on Audio, Speech, and Language Processing, Vol. 15, No. 6, pp. 1766-1776, August 2007.
BibTeX IEEE Xplore
- @article{Reddy2007aug,
- author = {Reddy, A.M. and Raj, B.},
- title = {{Soft Mask Methods for Single-Channel Speaker Separation}},
- journal = {IEEE Transactions on Audio, Speech, and Language Processing},
- year = 2007,
- volume = 15,
- number = 6,
- pages = {1766--1776},
- month = aug,
- issn = {1558-7916},
- url = {https://ieeexplore.ieee.org/document/4276763}
- }
Smaragdis, P., Shashanka, M., "A Framework for Secure Speech Recognition", IEEE Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASL.2007.894526, Vol. 15, No. 4, pp. 1404-1413, May 2007.
BibTeX TR2007-057 PDF
- @article{Smaragdis2007may,
- author = {Smaragdis, P. and Shashanka, M.},
- title = {{A Framework for Secure Speech Recognition}},
- journal = {IEEE Transactions on Audio, Speech, and Language Processing},
- year = 2007,
- volume = 15,
- number = 4,
- pages = {1404--1413},
- month = may,
- doi = {10.1109/TASL.2007.894526},
- issn = {1558-7916},
- url = {https://www.merl.com/publications/TR2007-057}
- }
Tse, E., Shen, C., Greenberg, S., Forlines, C., "How Pairs Interact Over a Multimodal Digital Table", Conference on Human Factors in Computing Systems (SIGCHI), April 2007, pp. 215-218.
BibTeX TR2007-055 PDF
- @inproceedings{Tse2007apr,
- author = {Tse, E. and Shen, C. and Greenberg, S. and Forlines, C.},
- title = {{How Pairs Interact Over a Multimodal Digital Table}},
- booktitle = {Conference on Human Factors in Computing Systems (SIGCHI)},
- year = 2007,
- pages = {215--218},
- month = apr,
- isbn = {978-1-59593-593-9},
- url = {https://www.merl.com/publications/TR2007-055}
- }
Draper, S.C., Khisti, A., Martinian, E., Vetro, A., Yedidia, J.S., "Using Distributed Source Coding to Secure Fingerprint Biometrics", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 2, pp. 129-132.
BibTeX TR2007-005 PDF
- @inproceedings{Draper2007apr,
- author = {Draper, S.C. and Khisti, A. and Martinian, E. and Vetro, A. and Yedidia, J.S.},
- title = {{Using Distributed Source Coding to Secure Fingerprint Biometrics}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2007,
- volume = 2,
- pages = {129--132},
- month = apr,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2007-005}
- }
Raj, B., Singh, R., Shashanka, M., Smaragdis, P., "Bandwidth Expansion with a Pólya Urn Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 4, pp. IV597-IV600.
BibTeX TR2007-058 PDF
- @inproceedings{Raj2007apr,
- author = {Raj, B. and Singh, R. and Shashanka, M. and Smaragdis, P.},
- title = {{Bandwidth Expansion with a P{\'o}lya Urn Model}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2007,
- volume = 4,
- pages = {IV597--IV600},
- month = apr,
- url = {https://www.merl.com/publications/TR2007-058}
- }
Shashanka, M.V.S., Raj, B., Smaragdis, P., "Sparse Overcomplete Decomposition for Single Channel Speaker Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 2, pp. 641-644.
BibTeX TR2007-031 PDF
- @inproceedings{Shashanka2007apr,
- author = {Shashanka, M.V.S. and Raj, B. and Smaragdis, P.},
- title = {{Sparse Overcomplete Decomposition for Single Channel Speaker Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2007,
- volume = 2,
- pages = {641--644},
- month = apr,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2007-031}
- }
Smaragdis, P., Shashanka, M., "A Framework for Secure Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 4, pp. 969-972.
BibTeX IEEE Xplore
- @inproceedings{Smaragdis2007apr,
- author = {Smaragdis, P. and Shashanka, M.},
- title = {{A Framework for Secure Speech Recognition}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2007,
- volume = 4,
- pages = {969--972},
- month = apr,
- issn = {1520-6149},
- url = {https://ieeexplore.ieee.org/document/4218264}
- }
Smaragdis, P., "Convolutive Speech Bases and their Application to Supervised Speech Separation", IEEE Transactions on Audio, Speech, and Language Processing, Vol. 15, No. 1, pp. 1-12, January 2007.
BibTeX TR2007-002 PDF
- @article{Smaragdis2007jan2,
- author = {Smaragdis, P.},
- title = {{Convolutive Speech Bases and their Application to Supervised Speech Separation}},
- journal = {IEEE Transactions on Audio, Speech, and Language Processing},
- year = 2007,
- volume = 15,
- number = 1,
- pages = {1--12},
- month = jan,
- issn = {1558-7916},
- url = {https://www.merl.com/publications/TR2007-002}
- }
Smaragdis, P., Boufounos, P., "Position and Trajectory Learning for Microphone Arrays", IEEE Transactions on Audio, Speech, and Language Processing, Vol. 15, No. 1, pp. 358-368, January 2007.
BibTeX TR2007-001 PDF
- @article{Smaragdis2007jan1,
- author = {Smaragdis, P. and Boufounos, P.},
- title = {{Position and Trajectory Learning for Microphone Arrays}},
- journal = {IEEE Transactions on Audio, Speech, and Language Processing},
- year = 2007,
- volume = 15,
- number = 1,
- pages = {358--368},
- month = jan,
- issn = {1558-7916},
- url = {https://www.merl.com/publications/TR2007-001}
- }
Tse, E., Greenberg, S., Shen, C., "GSI Demo: Multiuser Gesture/Speech Interaction over Digital Tables by Wrapping Single User Applications", International Conference on Multimodal Interfaces (ICMI), November 2006, pp. 76-83.
BibTeX TR2006-085 PDF
- @inproceedings{Tse2006nov,
- author = {Tse, E. and Greenberg, S. and Shen, C.},
- title = {{GSI Demo: Multiuser Gesture/Speech Interaction over Digital Tables by Wrapping Single User Applications}},
- booktitle = {International Conference on Multimodal Interfaces (ICMI)},
- year = 2006,
- pages = {76--83},
- month = nov,
- isbn = {1-59593-541-X},
- url = {https://www.merl.com/publications/TR2006-085}
- }
Weinberg, G., Raj, B., Kalgaonkar, K., "Two New Techniques for Natural Spoken User Interfaces", ACM Symposium on User Interface Software and Technology (UIST), October 2006.
BibTeX TR2006-098 PDF
- @inproceedings{Weinberg2006oct,
- author = {Weinberg, G. and Raj, B. and Kalgaonkar, K.},
- title = {{Two New Techniques for Natural Spoken User Interfaces}},
- booktitle = {ACM Symposium on User Interface Software and Technology (UIST)},
- year = 2006,
- month = oct,
- url = {https://www.merl.com/publications/TR2006-098}
- }
Wittenburg, K., Lanning, T., Schwenke, D., Shubin, H., Vetro, A., "The Prospects for Unrestricted Speech Input for TV Content Search", International Working Conference on Advanced Visual Interfaces (AVI), May 2006.
BibTeX TR2006-045 PDF
- @inproceedings{Wittenburg2006may,
- author = {Wittenburg, K. and Lanning, T. and Schwenke, D. and Shubin, H. and Vetro, A.},
- title = {{The Prospects for Unrestricted Speech Input for TV Content Search}},
- booktitle = {International Working Conference on Advanced Visual Interfaces (AVI)},
- year = 2006,
- month = may,
- url = {https://www.merl.com/publications/TR2006-045}
- }
Tse, E., Shen, C., Greenberg, S., Forlines, C., "Enabling Interaction with Single User Applications through Speech and Gestures on a Multi-User Tabletop", International Working Conference on Advanced Visual Interfaces (AVI), May 2006.
BibTeX TR2005-130 PDF
- @inproceedings{Tse2006may1,
- author = {Tse, E. and Shen, C. and Greenberg, S. and Forlines, C.},
- title = {{Enabling Interaction with Single User Applications through Speech and Gestures on a Multi-User Tabletop}},
- booktitle = {International Working Conference on Advanced Visual Interfaces (AVI)},
- year = 2006,
- month = may,
- url = {https://www.merl.com/publications/TR2005-130}
- }
Radhakrishnan, R., Divakaran, A., "Generative Process Tracking for Audio Analysis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006, vol. 5, pp. V.
BibTeX TR2006-053 PDF
- @inproceedings{Radhakrishnan2006may,
- author = {Radhakrishnan, R. and Divakaran, A.},
- title = {{Generative Process Tracking for Audio Analysis}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2006,
- volume = 5,
- pages = {V},
- month = may,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2006-053}
- }
Raj, B., Shashanka, M.V.S., Smaragdis, P., "Latent Dirichlet Decomposition for Single Channel Speaker Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006.
BibTeX TR2006-064 PDF
- @inproceedings{Raj2006may,
- author = {Raj, B. and Shashanka, M.V.S. and Smaragdis, P.},
- title = {{Latent Dirichlet Decomposition for Single Channel Speaker Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2006,
- month = may,
- url = {https://www.merl.com/publications/TR2006-064}
- }
Shashanka, M.V.S., Smaragdis, P., "Secure Sound Classification: Gaussian Mixture Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006.
BibTeX TR2006-065 PDF
- @inproceedings{Shashanka2006may,
- author = {Shashanka, M.V.S. and Smaragdis, P.},
- title = {{Secure Sound Classification: Gaussian Mixture Models}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2006,
- month = may,
- url = {https://www.merl.com/publications/TR2006-065}
- }
Tse, E., Greenberg, S., Shen, C., Forlines, C., "Multimodal Multiplayer Tabletop Gaming", International Workshop on Pervasive Gaming Applications (PerGames), May 2006.
BibTeX TR2006-009 PDF
- @inproceedings{Tse2006may2,
- author = {Tse, E. and Greenberg, S. and Shen, C. and Forlines, C.},
- title = {{Multimodal Multiplayer Tabletop Gaming}},
- booktitle = {International Workshop on Pervasive Gaming Applications (PerGames)},
- year = 2006,
- month = may,
- url = {https://www.merl.com/publications/TR2006-009}
- }
Xing, L., Yu, H., Huang, Q., Ye, Q., Divakaran, A., "Subjective Evaluation Criterion for Selecting Affective Features and Modeling Highlights", SPIE Conference on Multimedia Content Analysis, Management and Retrieval, January 2006, vol. 6073, pp. 188-195.
BibTeX TR2006-027 PDF
- @inproceedings{Xing2006jan,
- author = {Xing, L. and Yu, H. and Huang, Q. and Ye, Q. and Divakaran, A.},
- title = {{Subjective Evaluation Criterion for Selecting Affective Features and Modeling Highlights}},
- booktitle = {SPIE Conference on Multimedia Content Analysis, Management and Retrieval},
- year = 2006,
- volume = 6073,
- pages = {188--195},
- month = jan,
- url = {https://www.merl.com/publications/TR2006-027}
- }
Shen, C., "Multi-User Interface and Interactions on Direct-Touch Horizontal Surfaces: Collaborative Tabletop Research at MERL", IEEE International Workshop on Horizontal Interactive Human-Computer Systems (TableTop), January 2006, pp. 53-54.
BibTeX TR2005-119 PDF
- @inproceedings{Shen2006jan,
- author = {Shen, C.},
- title = {{Multi-User Interface and Interactions on Direct-Touch Horizontal Surfaces: Collaborative Tabletop Research at MERL}},
- booktitle = {IEEE International Workshop on Horizontal Interactive Human-Computer Systems (TableTop)},
- year = 2006,
- pages = {53--54},
- month = jan,
- isbn = {0-7695-2494-X},
- url = {https://www.merl.com/publications/TR2005-119}
- }
Raj, B., Singh, R., "Reconstructing Spectral Vectors with Uncertain Spectrographic Masks for Robust Speech Recognition", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), November 2005, pp. 27-32.
BibTeX TR2005-160 PDF
- @inproceedings{Raj2005nov,
- author = {Raj, B. and Singh, R.},
- title = {{Reconstructing Spectral Vectors with Uncertain Spectrographic Masks for Robust Speech Recognition}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2005,
- pages = {27--32},
- month = nov,
- url = {https://www.merl.com/publications/TR2005-160}
- }
Hu, R., Raj, B., "A Robust Voice Activity Detector Using an Acoustic Doppler Radar", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), November 2005, pp. 171-176.
BibTeX TR2005-159 PDF
- @inproceedings{Hu2005nov,
- author = {Hu, R. and Raj, B.},
- title = {{A Robust Voice Activity Detector Using an Acoustic Doppler Radar}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2005,
- pages = {171--176},
- month = nov,
- url = {https://www.merl.com/publications/TR2005-159}
- }
Raj, B., Smaragdis, P., "Latent Variable Decomposition of Spectrograms for Single Channel Speaker Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2005, pp. 17-20.
BibTeX TR2005-137 PDF
- @inproceedings{Raj2005oct,
- author = {Raj, B. and Smaragdis, P.},
- title = {{Latent Variable Decomposition of Spectrograms for Single Channel Speaker Separation}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2005,
- pages = {17--20},
- month = oct,
- url = {https://www.merl.com/publications/TR2005-137}
- }
Brand, M., "Nonrigid Embeddings for Dimensionality Reduction", European Conference on Machine Learning (ECML), October 2005, vol. 3720.
BibTeX TR2005-117 PDF
- @inproceedings{Brand2005oct,
- author = {Brand, M.},
- title = {{Nonrigid Embeddings for Dimensionality Reduction}},
- booktitle = {European Conference on Machine Learning (ECML)},
- year = 2005,
- volume = 3720,
- month = oct,
- isbn = {3-540-29243-8},
- url = {https://www.merl.com/publications/TR2005-117}
- }
Bansal, D., Raj, B., Smaragdis, P., "Bandwidth Expansion of Narrowband Speech Using Non-Negative Matrix Factorization", Eurospeech, September 2005.
BibTeX TR2005-135 PDF
- @inproceedings{Bansal2005sep,
- author = {Bansal, D. and Raj, B. and Smaragdis, P.},
- title = {{Bandwidth Expansion of Narrowband Speech Using Non-Negative Matrix Factorization}},
- booktitle = {Eurospeech},
- year = 2005,
- month = sep,
- url = {https://www.merl.com/publications/TR2005-135}
- }
Raj, B., Singh, R., Smaragdis, P., "Recognizing Speech from Simultaneous Speakers", Eurospeech, September 2005.
BibTeX TR2005-136 PDF
- @inproceedings{Raj2005sep,
- author = {Raj, B. and Singh, R. and Smaragdis, P.},
- title = {{Recognizing Speech from Simultaneous Speakers}},
- booktitle = {Eurospeech},
- year = 2005,
- month = sep,
- url = {https://www.merl.com/publications/TR2005-136}
- }