Publications

235 / 3,841 publications found.


  •  Singh, R., Raj, B., "Classification in Likelihood Spaces", Technometrics, Vol. 46, No. 3, pp. 318-329, August 2004.
    BibTeX TR2004-089 PDF
    • @article{Singh2004aug,
    • author = {Singh, R. and Raj, B.},
    • title = {{Classification in Likelihood Spaces}},
    • journal = {Technometrics},
    • year = 2004,
    • volume = 46,
    • number = 3,
    • pages = {318--329},
    • month = aug,
    • issn = {0040-1706},
    • url = {https://www.merl.com/publications/TR2004-089}
    • }
  •  Smaragdis, P., "Exploiting Redundancy to Construct Listening Systems", Perspectives on Speech Separation, July 2004.
    BibTeX SpringerLink
    • @inproceedings{Smaragdis2004jul,
    • author = {Smaragdis, P.},
    • title = {{Exploiting Redundancy to Construct Listening Systems}},
    • booktitle = {Perspectives on Speech Separation},
    • year = 2004,
    • month = jul,
    • url = {https://link.springer.com/chapter/10.1007/0-387-22794-6_7}
    • }
  •  Radhakrishnan, R., Xiong, Z., Divakaran, A., Memon, N., "Time Series Analysis and Segmentation Using Eigenvectors for Mining Semantic Audio Label Sequences", IEEE International Conference on Multimedia and Expo (ICME), June 2004.
    BibTeX TR2004-063 PDF
    • @inproceedings{Radhakrishnan2004jun,
    • author = {Radhakrishnan, R. and Xiong, Z. and Divakaran, A. and Memon, N.},
    • title = {{Time Series Analysis and Segmentation Using Eigenvectors for Mining Semantic Audio Label Sequences}},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2004,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2004-063}
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Effective and Efficient Sports Highlights Extraction Using the Minimum Description Length Criterion in Selecting GMM Structures", IEEE International Conference on Multimedia and Expo (ICME), June 2004.
    BibTeX TR2004-061 PDF
    • @inproceedings{Xiong2004jun,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
    • title = {{Effective and Efficient Sports Highlights Extraction Using the Minimum Description Length Criterion in Selecting GMM Structures}},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2004,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2004-061}
    • }
  •  Brown, J.C., Smaragdis, P., "Independent Component Analysis for Automatic Note Extraction from Musical Trills", Journal of the Acoustical Society of America, Vol. 115, No. 5, pp. 2295-2306, May 2004.
    BibTeX TR2004-078 PDF
    • @article{Brown2004may,
    • author = {Brown, J.C. and Smaragdis, P.},
    • title = {{Independent Component Analysis for Automatic Note Extraction from Musical Trills}},
    • journal = {Journal of the Acoustical Society of America},
    • year = 2004,
    • volume = 115,
    • number = 5,
    • pages = {2295--2306},
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-078}
    • }
  •  Raj, B., Singh, R., Stern, R.M., "On Tracking Noise with Linear Dynamical System Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2004, vol. 1, pp. 965-968.
    BibTeX TR2004-042 PDF
    • @inproceedings{Raj2004may,
    • author = {Raj, B. and Singh, R. and Stern, R.M.},
    • title = {{On Tracking Noise with Linear Dynamical System Models}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2004,
    • volume = 1,
    • pages = {965--968},
    • month = may,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2004-042}
    • }
  •  DeVault, D., Rich, C., Sidner, C.L., "Natural Language Generation and Discourse Context: Computing Distractor Sets from the Focus Stack", International Florida Artificial Intelligence Research Symposium (FLAIRS), May 2004.
    BibTeX TR2004-004 PDF
    • @inproceedings{DeVault2004may,
    • author = {DeVault, D. and Rich, C. and Sidner, C.L.},
    • title = {{Natural Language Generation and Discourse Context: Computing Distractor Sets from the Focus Stack}},
    • booktitle = {International Florida Artificial Intelligence Research Symposium (FLAIRS)},
    • year = 2004,
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-004}
    • }
  •  Divi, V., Forlines, C., van Gemert, J.V., Raj, B., Schmidt-Nielsen, B., Wittenburg, K., Woelfel, J., Wolf, P., Zhang, F., "A Speech-In List-Out Approach to Spoken User Interfaces", Human Language Technology Conference (HLT), May 2004.
    BibTeX TR2004-023 PDF
    • @inproceedings{Divi2004may,
    • author = {Divi, V. and Forlines, C. and {van Gemert}, J.V. and Raj, B. and Schmidt-Nielsen, B. and Wittenburg, K. and Woelfel, J. and Wolf, P. and Zhang, F.},
    • title = {{A Speech-In List-Out Approach to Spoken User Interfaces}},
    • booktitle = {Human Language Technology Conference (HLT)},
    • year = 2004,
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-023}
    • }
  •  Radhakrishnan, R., Xiong, Z., Divakaran, A., Ishikawa, Y., "Generation of Sports Highlights Using a Combination of Supervised & Unsupervised Learning in Audio Domain", IEEE Pacific-Rim Conference on Multimedia (PCM), December 2003, vol. 2, pp. 935-939.
    BibTeX TR2003-144 PDF
    • @inproceedings{Radhakrishan2003dec,
    • author = {Radhakrishnan, R. and Xiong, Z. and Divakaran, A. and Ishikawa, Y.},
    • title = {{Generation of Sports Highlights Using a Combination of Supervised \& Unsupervised Learning in Audio Domain}},
    • booktitle = {IEEE Pacific-Rim Conference on Multimedia (PCM)},
    • year = 2003,
    • volume = 2,
    • pages = {935--939},
    • month = dec,
    • url = {https://www.merl.com/publications/TR2003-144}
    • }
  •  Raj, B., Seltzer, M.L., Reyes-Gomez, M.J., "Speech Recognizer Based Maximum Likelihood Beamforming", NSF Workshop on Perspectives on Speech Separation, October 2003.
    BibTeX TR2003-87 PDF
    • @inproceedings{Raj2003oct,
    • author = {Raj, B. and Seltzer, M.L. and Reyes-Gomez, M.J.},
    • title = {{Speech Recognizer Based Maximum Likelihood Beamforming}},
    • booktitle = {NSF Workshop on Perspectives on Speech Separation},
    • year = 2003,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-87}
    • }
  •  Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 13-16.
    BibTeX TR2003-88 PDF
    • @inproceedings{Reyes-Gomez2003oct,
    • author = {Reyes-Gomez, M.J. and Raj, B. and Ellis, D.P.W.},
    • title = {{Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2003,
    • pages = {13--16},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-88}
    • }
  •  Smaragdis, P., Brown, J.C., "Non-negative Matrix Factorization for Polyphonic Music Transcription", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 177-180.
    BibTeX TR2003-139 PDF
    • @inproceedings{Smaragdis2003oct,
    • author = {Smaragdis, P. and Brown, J.C.},
    • title = {{Non-negative Matrix Factorization for Polyphonic Music Transcription}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2003,
    • pages = {177--180},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-139}
    • }
  •  Lamere, P., Kwok, P., Walker, W., Gouvea, E., Singh, R., Raj, B., Wolf, P.P., "Design of the CMU Sphinx-4 Decoder", Eurospeech, September 2003.
    BibTeX TR2003-110 PDF
    • @inproceedings{Lamere2003sep,
    • author = {Lamere, P. and Kwok, P. and Walker, W. and Gouvea, E. and Singh, R. and Raj, B. and Wolf, P.P.},
    • title = {{Design of the CMU Sphinx-4 Decoder}},
    • booktitle = {Eurospeech},
    • year = 2003,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2003-110}
    • }
  •  Singh, R., Warmuth, M., Raj, B., Lamere, P., "Classification with Free Energy at Raised Temperatures", Eurospeech, September 2003.
    BibTeX TR2003-22 PDF
    • @inproceedings{Singh2003sep,
    • author = {Singh, R. and Warmuth, M. and Raj, B. and Lamere, P.},
    • title = {{Classification with Free Energy at Raised Temperatures}},
    • booktitle = {Eurospeech},
    • year = 2003,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2003-22}
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification", IEEE International Conference on Multimedia and Expo (ICME), DOI: 10.1109/ICME.2003.1221332, July 2003, vol. 3, pp. 397-400.
    BibTeX TR2004-082 PDF
    • @inproceedings{Xiong2003jul2,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
    • title = {{Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification}},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2003,
    • volume = 3,
    • pages = {397--400},
    • month = jul,
    • doi = {10.1109/ICME.2003.1221332},
    • url = {https://www.merl.com/publications/TR2004-082}
    • }
  •  Raj, B., Whittaker, E.W.D., "Lossless Compression of Language Model Structure and Word Identifiers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003, vol. 1, pp. 388-391.
    BibTeX IEEE Xplore
    • @inproceedings{Raj2003apr,
    • author = {Raj, B. and Whittaker, E.W.D.},
    • title = {{Lossless Compression of Language Model Structure and Word Identifiers}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 1,
    • pages = {388--391},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1198799}
    • }
  •  Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Factorial HMMs", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003.
    BibTeX
    • @inproceedings{Reyes-Gomez2003apr,
    • author = {Reyes-Gomez, M.J. and Raj, B. and Ellis, D.P.W.},
    • title = {{Multi-Channel Source Separation by Factorial HMMs}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • month = apr
    • }
  •  Singh, R., Raj, B., "Tracking Noise via Dynamical Systems with a Continuum of States", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003.
    BibTeX
    • @inproceedings{Singh2003apr,
    • author = {Singh, R. and Raj, B.},
    • title = {{Tracking Noise via Dynamical Systems with a Continuum of States}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • month = apr
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2003.1200048, April 2003, vol. 5, pp. 628-631.
    BibTeX IEEE Xplore
    • @inproceedings{Xiong2003apr1,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
    • title = {{Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 5,
    • pages = {628--631},
    • month = apr,
    • doi = {10.1109/ICASSP.2003.1200048},
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1200048}
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Audio Events Detection Based Highlights Extraction from Baseball, Golf and Soccer Games in a Unified Framework", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003, vol. 5, pp. 632-635.
    BibTeX IEEE Xplore
    • @inproceedings{Xiong2003apr2,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
    • title = {{Audio Events Detection Based Highlights Extraction from Baseball, Golf and Soccer Games in a Unified Framework}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 5,
    • pages = {632--635},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1200049}
    • }
  •  Smaragdis, P., Casey, M., "Audio/Visual Independent Components", International Symposium on Independent Component Analysis and Blind Source Separation (ICA), April 2003, pp. 709-714.
    BibTeX TR2003-138 PDF
    • @inproceedings{Smaragdis2003apr,
    • author = {Smaragdis, P. and Casey, M.},
    • title = {{Audio/Visual Independent Components}},
    • booktitle = {International Symposium on Independent Component Analysis and Blind Source Separation (ICA)},
    • year = 2003,
    • pages = {709--714},
    • month = apr,
    • url = {https://www.merl.com/publications/TR2003-138}
    • }
  •  Seltzer, M.L., Raj, B., "Speech Recognizer Based Filter Optimization for Microphone Array Processing", IEEE Signal Processing Letters, Vol. 10, No. 3, pp. 69-71, March 2003.
    BibTeX IEEE Xplore
    • @article{Seltzer2003mar,
    • author = {Seltzer, M.L. and Raj, B.},
    • title = {{Speech Recognizer Based Filter Optimization for Microphone Array Processing}},
    • journal = {IEEE Signal Processing Letters},
    • year = 2003,
    • volume = 10,
    • number = 3,
    • pages = {69--71},
    • month = mar,
    • issn = {1070-9908},
    • url = {https://ieeexplore.ieee.org/document/1182087}
    • }
  •  Raj, B., Singh, R., "Classifier-Based Non-Linear Projection for Adaptive Endpointing of Continuous Speech", Computer Speech and Language, Vol. 17, No. 1, pp. 5-26, January 2003.
    BibTeX
    • @article{Raj2003jan,
    • author = {Raj, B. and Singh, R.},
    • title = {{Classifier-Based Non-Linear Projection for Adaptive Endpointing of Continuous Speech}},
    • journal = {Computer Speech and Language},
    • year = 2003,
    • volume = 17,
    • number = 1,
    • pages = {5--26},
    • month = jan
    • }
  •  Divakaran, A., Radhakrishnan, R., Xiong, Z., Casey, M., "Procedure for Audio-Assisted Browsing of News Video Using Generalized Sound Recognition", SPIE Conference on Storage and Retrieval for Multimedia Databases, DOI: 10.1117/12.476294, January 2003, vol. 5021, pp. 160-166.
    BibTeX SPIE Digital Library
    • @inproceedings{Divakaran2003jan,
    • author = {Divakaran, A. and Radhakrishnan, R. and Xiong, Z. and Casey, M.},
    • title = {{Procedure for Audio-Assisted Browsing of News Video Using Generalized Sound Recognition}},
    • booktitle = {SPIE Conference on Storage and Retrieval for Multimedia Databases},
    • year = 2003,
    • volume = 5021,
    • pages = {160--166},
    • month = jan,
    • doi = {10.1117/12.476294},
    • url = {https://www.spiedigitallibrary.org/conference-proceedings-of-spie/5021/0000/Procedure-for-audio-assisted-browsing-of-news-video-using-generalized/10.1117/12.476294.short?SSO=1}
    • }
  •  Wolf, P., Raj, B., "The MERL SpokenQuery Information Retrieval System: A System for Retrieving Pertinent Documents from a Spoken Query", IEEE International Conference on Multimedia and Expo (ICME), August 2002, vol. 2, pp. 317-320.
    BibTeX TR2002-57 PDF
    • @inproceedings{Wolf2002aug,
    • author = {Wolf, P. and Raj, B.},
    • title = {{The MERL SpokenQuery Information Retrieval System: A System for Retrieving Pertinent Documents from a Spoken Query}},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2002,
    • volume = 2,
    • pages = {317--320},
    • month = aug,
    • url = {https://www.merl.com/publications/TR2002-57}
    • }