Publications

597 / 3,604 publications found.


  •  Chen, C., Liu, M.-Y., Tuzel, C.O., Xiao, J., "R-CNN for Small Object Detection", Asian Conference on Computer Vision (ACCV), DOI: 10.1007/​978-3-319-54193-8_14, November 2016, vol. 10115, pp. 214-230.
    BibTeX TR2016-144 PDF
    • @inproceedings{Chen2016nov,
    • author = {Chen, Chenyi and Liu, Ming-Yu and Tuzel, C. Oncel and Xiao, Jianxiong},
    • title = {{R-CNN} for Small Object Detection},
    • booktitle = {Asian Conference on Computer Vision (ACCV)},
    • year = 2016,
    • volume = 10115,
    • pages = {214--230},
    • month = nov,
    • doi = {10.1007/978-3-319-54193-8_14},
    • url = {https://www.merl.com/publications/TR2016-144}
    • }
  •  Tawara, N., Ogawa, T., Watanabe, S., Kobayashi, T., "Nested Gibbs sampling for mixture-of-mixture model and its application to speaker clustering", APSIPA Transactions on Signal and Information Processing, DOI: 10.1017/​ATSIP.2016.15, Vol. 5, October 2016.
    BibTeX TR2016-138 PDF
    • @article{Tawara2016oct,
    • author = {Tawara, Naohiro and Ogawa, Tetsuji and Watanabe, Shinji and Kobayashi, Tetsunori},
    • title = {Nested {Gibbs} sampling for mixture-of-mixture model and its application to speaker clustering},
    • journal = {APSIPA Transactions on Signal and Information Processing},
    • year = 2016,
    • volume = 5,
    • month = oct,
    • doi = {10.1017/ATSIP.2016.15},
    • url = {https://www.merl.com/publications/TR2016-138}
    • }
  •  Ozcan, G., Pajovic, M., Sahinoglu, Z., Wang, Y., Orlik, P.V., Wada, T., "Online State of Charge Estimation for Lithium-Ion Batteries Using Gaussian Process Regression", IEEE Industrial Electronics Society (IECON), DOI: 10.1109/​IECON.2016.7793002, October 2016, pp. 998-1003.
    BibTeX TR2016-136 PDF
    • @inproceedings{Ozcan2016oct,
    • author = {Ozcan, Gozde and Pajovic, Milutin and Sahinoglu, Zafer and Wang, Yebin and Orlik, Philip V. and Wada, Toshihiro},
    • title = {Online State of Charge Estimation for Lithium-Ion Batteries Using {Gaussian} Process Regression},
    • booktitle = {IEEE Industrial Electronics Society (IECON)},
    • year = 2016,
    • pages = {998--1003},
    • month = oct,
    • doi = {10.1109/IECON.2016.7793002},
    • url = {https://www.merl.com/publications/TR2016-136}
    • }
  •  Tuzel, C.O., Marks, T.K., Tambe, S., "Robust Face Alignment Using a Mixture of Invariant Experts", European Conference on Computer Vision (ECCV), DOI: 10.1007/​978-3-319-46454-1_50, October 2016, vol. 9909, pp. 825-841.
    BibTeX TR2016-129 PDF
    • @inproceedings{Tuzel2016oct,
    • author = {Tuzel, C. Oncel and Marks, Tim K. and Tambe, Salil},
    • title = {Robust Face Alignment Using a Mixture of Invariant Experts},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2016,
    • volume = 9909,
    • pages = {825--841},
    • month = oct,
    • doi = {10.1007/978-3-319-46454-1_50},
    • url = {https://www.merl.com/publications/TR2016-129}
    • }
  •  Sankaran, B., Ramalingam, S., Taguchi, Y., "Parameter Learning for Improving Binary Descriptor Matching", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/​IROS.2016.7759718, October 2016, pp. 4892-4897.
    BibTeX TR2016-132 PDF
    • @inproceedings{Sankaran2016oct,
    • author = {Sankaran, Bharath and Ramalingam, Srikumar and Taguchi, Yuichi},
    • title = {Parameter Learning for Improving Binary Descriptor Matching},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2016,
    • pages = {4892--4897},
    • month = oct,
    • doi = {10.1109/IROS.2016.7759718},
    • url = {https://www.merl.com/publications/TR2016-132}
    • }
  •  Delcroix, M., Watanabe, S., "Recent Advances in Distant Speech Recognition," Tech. Rep. TR2016-115, Interspeech Tutorials, September 2016.
    BibTeX TR2016-115 PDF
    • @techreport{Delcroix2016sep,
    • author = {Delcroix, Marc and Watanabe, Shinji},
    • title = {Recent Advances in Distant Speech Recognition},
    • booktitle = {Interspeech Tutorials},
    • institution = {Interspeech},
    • year = 2016,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-115}
    • }
  •  Le Roux, J., Vincent, E., Erdogan, H., "Learning-Based Approaches to Speech Enhancement and Separation," Tech. Rep. TR2016-113, Interspeech Tutorials, September 2016.
    BibTeX TR2016-113 PDF
    • @techreport{LeRoux2016sep,
    • author = {Le Roux, Jonathan and Vincent, Emmanuel and Erdogan, Hakan},
    • title = {Learning-Based Approaches to Speech Enhancement and Separation},
    • booktitle = {Interspeech Tutorials},
    • institution = {Interspeech},
    • year = 2016,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-113}
    • }
  •  Erdogan, H., Hershey, J.R., Watanabe, S., Mandel, M., Le Roux, J., "Improved MVDR beamforming using single-channel mask prediction networks", Interspeech, DOI: 10.21437/​Interspeech.2016-552, September 2016, pp. 1981-1985.
    BibTeX TR2016-072 PDF
    • @inproceedings{Erdogan2016sep,
    • author = {Erdogan, Hakan and Hershey, John R. and Watanabe, Shinji and Mandel, Michael and Le Roux, Jonathan},
    • title = {Improved {MVDR} beamforming using single-channel mask prediction networks},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {1981--1985},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-552},
    • url = {https://www.merl.com/publications/TR2016-072}
    • }
  •  Hori, C., Hori, T., Watanabe, S., Hershey, J.R., "Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs", Interspeech, DOI: 10.21437/​Interspeech.2016-1171, September 2016, pp. 3236-3240.
    BibTeX TR2016-074 PDF
    • @inproceedings{Hori2016sep,
    • author = {Hori, Chiori and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
    • title = {Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention {LSTMs}},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {3236--3240},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-1171},
    • url = {https://www.merl.com/publications/TR2016-074}
    • }
  •  Isik, Y., Le Roux, J., Chen, Z., Watanabe, S., Hershey, J.R., "Single-Channel Multi-Speaker Separation using Deep Clustering", Interspeech, DOI: 10.21437/​Interspeech.2016-1176, September 2016, pp. 545-549.
    BibTeX TR2016-073 PDF
    • @inproceedings{Isik2016sep,
    • author = {Isik, Yusuf and Le Roux, Jonathan and Chen, Zhuo and Watanabe, Shinji and Hershey, John R.},
    • title = {Single-Channel Multi-Speaker Separation using Deep Clustering},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {545--549},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-1176},
    • url = {https://www.merl.com/publications/TR2016-073}
    • }
  •  Zmolikova, K., Karafiat, M., Vesely, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J.H., "Data selection by sequence summarizing neural network in mismatch condition training", Interspeech, DOI: 10.21437/​Interspeech.2016-741, September 2016, pp. 2354-2358.
    BibTeX TR2016-075 PDF
    • @inproceedings{Zmolikova2016sep,
    • author = {Zmolikova, Katerina and Karafiat, Martin and Vesely, Karel and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan Honza},
    • title = {Data selection by sequence summarizing neural network in mismatch condition training},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {2354--2358},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-741},
    • url = {https://www.merl.com/publications/TR2016-075}
    • }
  •  Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), September 2016, pp. 35-39.
    BibTeX TR2016-114 PDF
    • @inproceedings{Hayashi2016sep,
    • author = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and Le Roux, Jonathan and Takeda, Kazuya},
    • title = {Bidirectional {LSTM-HMM} Hybrid System for Polyphonic Sound Event Detection},
    • booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
    • year = 2016,
    • pages = {35--39},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-114}
    • }
  •  Koike-Akino, T., Mahajan, R., Marks, T.K., Tuzel, C.O., Wang, Y., Watanabe, S., Orlik, P.V., "High-Accuracy User Identification Using EEG Biometrics", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/​EMBC.2016.7590835, August 2016, pp. 854-858.
    BibTeX TR2016-105 PDF Presentation
    • @inproceedings{Koike-Akino2016aug,
    • author = {Koike-Akino, Toshiaki and Mahajan, Ruhi and Marks, Tim K. and Tuzel, C. Oncel and Wang, Ye and Watanabe, Shinji and Orlik, Philip V.},
    • title = {High-Accuracy User Identification Using {EEG} Biometrics},
    • booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
    • year = 2016,
    • pages = {854--858},
    • month = aug,
    • doi = {10.1109/EMBC.2016.7590835},
    • url = {https://www.merl.com/publications/TR2016-105}
    • }
  •  Nikovski, D.N., Byadarhaly, K., "Regularized Covariance Matrix Estimation with High Dimensional Data for Supervised Anomaly Detection Problems", IEEE International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/​IJCNN.2016.7727554, July 2016, pp. 2811-2818.
    BibTeX TR2016-099 PDF
    • @inproceedings{Nikovski2016jul,
    • author = {Nikovski, Daniel N. and Byadarhaly, Kiran},
    • title = {Regularized Covariance Matrix Estimation with High Dimensional Data for Supervised Anomaly Detection Problems},
    • booktitle = {IEEE International Joint Conference on Neural Networks (IJCNN)},
    • year = 2016,
    • pages = {2811--2818},
    • month = jul,
    • doi = {10.1109/IJCNN.2016.7727554},
    • url = {https://www.merl.com/publications/TR2016-099}
    • }
  •  Hori, C., Watanabe, S., Hori, T., Harsham, B.A., Hershey, J.R., Koji, Y., Fujii, Y., Furumoto, Y., "Driver Confusion Status Detection Using Recurrent Neural Networks", IEEE International Conference on Multimedia and Expo (ICME), DOI: 10.1109/​ICME.2016.7552966, July 2016.
    BibTeX TR2016-088 PDF
    • @inproceedings{Hori2016jul,
    • author = {Hori, Chiori and Watanabe, Shinji and Hori, Takaaki and Harsham, Bret A. and Hershey, John R. and Koji, Yusuke and Fujii, Youichi and Furumoto, Yuki},
    • title = {Driver Confusion Status Detection Using Recurrent Neural Networks},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2016,
    • month = jul,
    • doi = {10.1109/ICME.2016.7552966},
    • url = {https://www.merl.com/publications/TR2016-088}
    • }
  •  Singh, B., Marks, T.K., Jones, M.J., Tuzel, C.O., Shao, M., "A Multi-Stream Bi-Directional Recurrent Neural Network for Fine-Grained Action Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR.2016.216, June 2016, pp. 1961-1970.
    BibTeX TR2016-080 PDF Data
    • @inproceedings{Singh2016jun,
    • author = {Singh, Bharat and Marks, Tim K. and Jones, Michael J. and Tuzel, C. Oncel and Shao, Ming},
    • title = {A Multi-Stream Bi-Directional Recurrent Neural Network for Fine-Grained Action Detection},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2016,
    • pages = {1961--1970},
    • month = jun,
    • doi = {10.1109/CVPR.2016.216},
    • url = {https://www.merl.com/publications/TR2016-080}
    • }
  •  Vemulapalli, R., Tuzel, C.O., Liu, M.-Y., "Deep Gaussian Conditional Random Field Network: A Model-based Deep Network for Discriminative Denoising", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR.2016.351, June 2016, pp. 4801-4809.
    BibTeX TR2016-079 PDF
    • @inproceedings{Vemulapalli2016jun2,
    • author = {Vemulapalli, Raviteja and Tuzel, C. Oncel and Liu, Ming-Yu},
    • title = {Deep {Gaussian} Conditional Random Field Network: A Model-based Deep Network for Discriminative Denoising},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2016,
    • pages = {4801--4809},
    • month = jun,
    • doi = {10.1109/CVPR.2016.351},
    • url = {https://www.merl.com/publications/TR2016-079}
    • }
  •  Vemulapalli, R., Tuzel, C.O., Liu, M.-Y., Chellappa, R., "Gaussian Conditional Random Field Network for Semantic Segmentation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2016, pp. 3224-3233.
    BibTeX TR2016-078 PDF
    • @inproceedings{Vemulapalli2016jun,
    • author = {Vemulapalli, Raviteja and Tuzel, C. Oncel and Liu, Ming-Yu and Chellappa, Rama},
    • title = {Gaussian Conditional Random Field Network for Semantic Segmentation},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2016,
    • pages = {3224--3233},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2016-078}
    • }
  •  Son, K., Liu, M.-Y., Taguchi, Y., "Learning to Remove Multipath Distortions in Time-of-Flight Range Images for a Robotic Arm Setup", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/​ICRA.2016.7487515, May 2016, pp. 3390-3397.
    BibTeX TR2016-036 PDF
    • @inproceedings{Son2016may,
    • author = {Son, Kilho and Liu, Ming-Yu and Taguchi, Yuichi},
    • title = {Learning to Remove Multipath Distortions in Time-of-Flight Range Images for a Robotic Arm Setup},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2016,
    • pages = {3390--3397},
    • month = may,
    • doi = {10.1109/ICRA.2016.7487515},
    • url = {https://www.merl.com/publications/TR2016-036}
    • }
  •  Jones, M.J., Nikovski, D.N., Imamura, M., Hirata, T., "Exemplar Learning for Extremely Efficient Anomaly Detection in Real-Valued Time Series", Journal of Data Mining and Knowledge Discovery, DOI: 10.1007/​s10618-015-0449-3, Vol. 30, No. 6, pp. 1427-1454, March 2016.
    BibTeX TR2016-027 PDF
    • @article{Jones2016mar,
    • author = {Jones, Michael J. and Nikovski, Daniel N. and Imamura, Makoto and Hirata, Takahisa},
    • title = {Exemplar Learning for Extremely Efficient Anomaly Detection in Real-Valued Time Series},
    • journal = {Journal of Data Mining and Knowledge Discovery},
    • year = 2016,
    • volume = 30,
    • number = 6,
    • pages = {1427--1454},
    • month = mar,
    • doi = {10.1007/s10618-015-0449-3},
    • issn = {1573-756X},
    • url = {https://www.merl.com/publications/TR2016-027}
    • }
  •  Hershey, J.R., Chen, Z., Le Roux, J., Watanabe, S., "Deep Clustering: Discriminative Embeddings for Segmentation and Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2016.7471631, March 2016, pp. 31-35.
    BibTeX TR2016-003 PDF
    • @inproceedings{Hershey2016mar,
    • author = {Hershey, John R. and Chen, Zhuo and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {Deep Clustering: Discriminative Embeddings for Segmentation and Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {31--35},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7471631},
    • url = {https://www.merl.com/publications/TR2016-003}
    • }
  •  Hori, T., Hori, C., Watanabe, S., Hershey, J.R., "Minimum Word Error Training of Long Short-Term Memory Recurrent Neural Network Language Models for Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2016.7472827, March 2016, pp. 5990-5994.
    BibTeX TR2016-011 PDF
    • @inproceedings{Hori2016mar,
    • author = {Hori, Takaaki and Hori, Chiori and Watanabe, Shinji and Hershey, John R.},
    • title = {Minimum Word Error Training of Long Short-Term Memory Recurrent Neural Network Language Models for Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {5990--5994},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7472827},
    • url = {https://www.merl.com/publications/TR2016-011}
    • }
  •  Vesely, K., Watanabe, S., Zmolikova, K., Karafiat, M., Burget, L., Cernocky, J.H., "Sequence Summarizing Neural Network for Speaker Adaptation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2016.7472692, March 2016, pp. 5315-5319.
    BibTeX TR2016-001 PDF
    • @inproceedings{Vesely2016mar,
    • author = {Vesely, Karel and Watanabe, Shinji and Zmolikova, Katerina and Karafiat, Martin and Burget, Lukas and Cernocky, Jan Honza},
    • title = {Sequence Summarizing Neural Network for Speaker Adaptation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {5315--5319},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7472692},
    • url = {https://www.merl.com/publications/TR2016-001}
    • }
  •  Wisdom, S., Hershey, J.R., Le Roux, J., Watanabe, S., "Deep Unfolding for Multichannel Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2016.7471649, March 2016, pp. 121-125.
    BibTeX TR2016-008 PDF
    • @inproceedings{Wisdom2016mar,
    • author = {Wisdom, Scott and Hershey, John R. and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {Deep Unfolding for Multichannel Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {121--125},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7471649},
    • url = {https://www.merl.com/publications/TR2016-008}
    • }
  •  Xiao, X., Watanabe, S., Erdogan, H., Lu, L., Hershey, J., Seltzer, M., Chen, G., Zhang, Y., Mandel, M., Yu, D., "Deep Beamforming Networks for Multi-Channel Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2016.7472778, March 2016, pp. 5745-5749.
    BibTeX TR2016-002 PDF
    • @inproceedings{Xiao2016mar,
    • author = {Xiao, Xiong and Watanabe, Shinji and Erdogan, Hakan and Lu, Liang and Hershey, John and Seltzer, Mike and Chen, Guoguo and Zhang, Yu and Mandel, Michael and Yu, Dong},
    • title = {Deep Beamforming Networks for Multi-Channel Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {5745--5749},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7472778},
    • url = {https://www.merl.com/publications/TR2016-002}
    • }