Publications

357 / 3,171 publications found.


  •  Koike-Akino, T., Wang, P., Pajovic, M., Sun, H., Orlik, P.V., "Fingerprinting-Based Indoor Localization with Commercial MMWave WiFi: A Deep Learning Approach", IEEE Access, DOI: 10.1109/​ACCESS.2020.2991129, April 2020.
    BibTeX TR2020-054 PDF Data
    • @article{Koike-Akino2020apr,
    • author = {Koike-Akino, Toshiaki and Wang, Pu and Pajovic, Milutin and Sun, Haijian and Orlik, Philip V.},
    • title = {Fingerprinting-Based Indoor Localization with Commercial MMWave WiFi: A Deep Learning Approach},
    • journal = {IEEE Access},
    • year = 2020,
    • month = apr,
    • doi = {10.1109/ACCESS.2020.2991129},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2020-054}
    • }
  •  Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Learning Invariant Representations from EEG via Adversarial Inference", IEEE Access, DOI: 10.1109/​ACCESS.2020.2971600, Vol. 8, pp. 27074-27085, April 2020.
    BibTeX TR2020-049 PDF
    • @article{Ozdenizci2020apr,
    • author = {Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    • title = {Learning Invariant Representations from EEG via Adversarial Inference},
    • journal = {IEEE Access},
    • year = 2020,
    • volume = 8,
    • pages = {27074--27085},
    • month = apr,
    • doi = {10.1109/ACCESS.2020.2971600},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2020-049}
    • }
  •  Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "End-To-End Multi-Speaker Speech Recognition with Transformer", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9054029, April 2020, pp. 6134-6138.
    BibTeX TR2020-043 PDF Video
    • @inproceedings{Chang2020apr,
    • author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {End-To-End Multi-Speaker Speech Recognition with Transformer},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {6134--6138},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054029},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-043}
    • }
  •  Pishdadian, F., Wichern, G., Le Roux, J., "Learning to Separate Sounds From Weakly Labeled Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9053055, April 2020, pp. 91-95.
    BibTeX TR2020-038 PDF Video
    • @inproceedings{Pishdadian2020apr,
    • author = {Pishdadian, Fatemeh and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Learning to Separate Sounds From Weakly Labeled Scenes},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {91--95},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9053055},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-038}
    • }
  •  Al-Shabili, A., Mansour, H., Boufounos, P.T., "Learning Plug-and-Play Proximal Quasi-Newton Denoisers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9054537, April 2020, pp. 8896-8900.
    BibTeX TR2020-045 PDF Video
    • @inproceedings{Al-Shabili2020apr,
    • author = {Al-Shabili, Abdullah and Mansour, Hassan and Boufounos, Petros T.},
    • title = {Learning Plug-and-Play Proximal Quasi-Newton Denoisers},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {8896--8900},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054537},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-045}
    • }
  •  Maciejewski, M., Wichern, G., McQuinn, E., Le Roux, J., "WHAMR!: Noisy and Reverberant Single-Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9053327, April 2020, pp. 696-700.
    BibTeX TR2020-042 PDF Video
    • @inproceedings{Maciejewski2020apr,
    • author = {Maciejewski, Matthew and Wichern, Gordon and McQuinn, Emmett and Le Roux, Jonathan},
    • title = {WHAMR!: Noisy and Reverberant Single-Channel Speech Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {696--700},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9053327},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-042}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Streaming Automatic Speech Recognition With The Transformer Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9054476, April 2020, pp. 6074-6078.
    BibTeX TR2020-040 PDF Video
    • @inproceedings{Moritz2020apr,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Streaming Automatic Speech Recognition With The Transformer Model},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {6074--6078},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054476},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-040}
    • }
  •  Sari, L., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Speaker Adaptation Using Attention-Based Speaker Memory For End-To-End ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9054249, April 2020, pp. 7384-7388.
    BibTeX TR2020-037 PDF Video
    • @inproceedings{Sari2020apr,
    • author = {Sari, Leda and Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Unsupervised Speaker Adaptation Using Attention-Based Speaker Memory For End-To-End ASR},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {7384--7388},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054249},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-037}
    • }
  •  Shi, L., Geng, S., Shuang, K., Hori, C., Liu, S., Gao, P., Su, S., "Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9053595, April 2020, pp. 4412-4416.
    BibTeX TR2020-046 PDF
    • @inproceedings{Shi2020apr,
    • author = {Shi, Lei and Geng, Shijie and Shuang, Kai and Hori, Chiori and Liu, Songxiang and Gao, Peng and Su, Sen},
    • title = {Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {4412--4416},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9053595},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-046}
    • }
  •  Zhang, S., Zhang, S., Wang, B., Habetler, T., "Deep Learning Algorithms for Bearing Fault Diagnostics – A Comprehensive Review", IEEE Access, DOI: 10.1109/​ACCESS.2020.2972859, Vol. 8, pp. 29857-29881, March 2020.
    BibTeX TR2020-034 PDF
    • @article{Zhang2020mar,
    • author = {Zhang, Shen and Zhang, Shibo and Wang, Bingnan and Habetler, Thomas},
    • title = {Deep Learning Algorithms for Bearing Fault Diagnostics -- A Comprehensive Review},
    • journal = {IEEE Access},
    • year = 2020,
    • volume = 8,
    • pages = {29857--29881},
    • month = mar,
    • doi = {10.1109/ACCESS.2020.2972859},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2020-034}
    • }
  •  Li, R., Wang, X., Mallidi, H., Watanabe, S., Hori, T., Hermansky, H., "Multi-Stream End-to-End Speech Recognition", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2019.2959721, Vol. 28, pp. 646-655, March 2020.
    BibTeX TR2020-030 PDF
    • @article{Li2020mar,
    • author = {Li, Ruizhi and Wang, Xiaofei and Mallidi, Harish and Watanabe, Shinji and Hori, Takaaki and Hermansky, Hynek},
    • title = {Multi-Stream End-to-End Speech Recognition},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2020,
    • volume = 28,
    • pages = {646--655},
    • month = mar,
    • doi = {10.1109/TASLP.2019.2959721},
    • url = {https://www.merl.com/publications/TR2020-030}
    • }
  •  D’Haro, L.F., Yoshino, K., Hori, C., Marks, T.K., Polymenakos, L., Kummerfeld, J.K., Galley, M., Gao, X., "Overview of the seventh Dialog System Technology Challenge: DSTC7", Computer Speech and Language, DOI: 10.1016/​j.csl.2020.101068, Vol. 62, March 2020.
    BibTeX TR2020-029 PDF
    • @article{DHaro2020mar,
    • author = {D'Haro, Luis Fernando and Yoshino, Koichiro and Hori, Chiori and Marks, Tim K. and Polymenakos, Lazaros and Kummerfeld, Jonathan K. and Galley, Michel and Gao, Xiang},
    • title = {Overview of the seventh Dialog System Technology Challenge: DSTC7},
    • journal = {Computer Speech and Language},
    • year = 2020,
    • volume = 62,
    • month = mar,
    • doi = {10.1016/j.csl.2020.101068},
    • url = {https://www.merl.com/publications/TR2020-029}
    • }
  •  Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Parsons, K., Sang, F., Klamkin, J., "Deep Neural Networks for Designing Integrated Photonics", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/​OFC.2020.Th1A.6, March 2020.
    BibTeX TR2020-057 PDF
    • @inproceedings{Kojima2020mar,
    • author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Parsons, Kieran and Sang, Fengqiao and Klamkin, Jonathan},
    • title = {Deep Neural Networks for Designing Integrated Photonics},
    • booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
    • year = 2020,
    • month = mar,
    • publisher = {OSA},
    • doi = {10.1364/OFC.2020.Th1A.6},
    • isbn = {978-1-943580-71-2},
    • url = {https://www.merl.com/publications/TR2020-057}
    • }
  •  Aihara, R., Wichern, G., Le Roux, J., "Deep Clustering-based Single Channel Speech Separation and Recent Advances", Acoustical Science and Technology, DOI: 10.1250/​ast.41.465, Vol. 41, No. 2, pp. 465-471, March 2020.
    BibTeX TR2021-020 PDF
    • @article{Aihara2020jun,
    • author = {Aihara, Ryo and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Deep Clustering-based Single Channel Speech Separation and Recent Advances},
    • journal = {Acoustical Science and Technology},
    • year = 2020,
    • volume = 41,
    • number = 2,
    • pages = {465--471},
    • month = mar,
    • doi = {10.1250/ast.41.465},
    • url = {https://www.merl.com/publications/TR2021-020}
    • }
  •  Ramachandra, B., Jones, M.J., Vatsavai, R., "Learning a distance function with a Siamese network to localize anomalies in videos", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/​WACV45572.2020.9093417, February 2020, pp. 2598-2607.
    BibTeX TR2020-015 PDF
    • @inproceedings{Jones2020feb,
    • author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
    • title = {Learning a distance function with a Siamese network to localize anomalies in videos},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2020,
    • pages = {2598--2607},
    • month = feb,
    • doi = {10.1109/WACV45572.2020.9093417},
    • url = {https://www.merl.com/publications/TR2020-015}
    • }
  •  Cherian, A., Wang, J., Hori, C., Marks, T.K., "Spatio-Temporal Ranked-Attention Networks for Video Captioning", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/​WACV45572.2020.9093291, February 2020, pp. 1606-1615.
    BibTeX TR2020-016 PDF
    • @inproceedings{Cherian2020feb,
    • author = {Cherian, Anoop and Wang, Jue and Hori, Chiori and Marks, Tim K.},
    • title = {Spatio-Temporal Ranked-Attention Networks for Video Captioning},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2020,
    • pages = {1606--1615},
    • month = feb,
    • publisher = {IEEE},
    • doi = {10.1109/WACV45572.2020.9093291},
    • url = {https://www.merl.com/publications/TR2020-016}
    • }
  •  Huang, R., Xu, W., Lee, T.-Y., Cherian, A., Wang, Y., Marks, T.K., "FX-GAN: Self-Supervised GAN Learning via Feature Exchange", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/​WACV45572.2020.9093525, February 2020, pp. 3183-3191.
    BibTeX TR2020-014 PDF
    • @inproceedings{Huang2020feb,
    • author = {Huang, Rui and Xu, Wenju and Lee, Teng-Yok and Cherian, Anoop and Wang, Ye and Marks, Tim K.},
    • title = {FX-GAN: Self-Supervised GAN Learning via Feature Exchange},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2020,
    • pages = {3183--3191},
    • month = feb,
    • publisher = {IEEE},
    • doi = {10.1109/WACV45572.2020.9093525},
    • url = {https://www.merl.com/publications/TR2020-014}
    • }
  •  He, W., Lee, T.-Y., van Baar, J., Wittenburg, K.B., Shen, H.-W., "DynamicsExplorer: Visual Analytics for Robot Control Tasks involving Dynamics and LSTM-based Control Policies", IEEE Pacific Visualization Symposium (PacificVis), DOI: 10.1109/​PacificVis48177.2020.7127, January 2020, pp. 36-45.
    BibTeX TR2020-011 PDF
    • @inproceedings{He2020jan,
    • author = {He, Wenbin and Lee, Teng-Yok and van Baar, Jeroen and Wittenburg, Kent B. and Shen, Han-Wei},
    • title = {DynamicsExplorer: Visual Analytics for Robot Control Tasks involving Dynamics and LSTM-based Control Policies},
    • booktitle = {IEEE Pacific Visualization Symposium (PacificVis)},
    • year = 2020,
    • pages = {36--45},
    • month = jan,
    • doi = {10.1109/PacificVis48177.2020.7127},
    • url = {https://www.merl.com/publications/TR2020-011}
    • }
  •  Chen, S., Duan, C., Yang, Y., Feng, C., Li, D., Tian, D., "Deep Unsupervised Learning of 3D Point Clouds via Graph Topology Inference and Filtering", IEEE Transactions on Image Processing, DOI: 10.1109/​TIP.2019.2957935, pp. 3183-3198, January 2020.
    BibTeX TR2020-004 PDF Software
    • @article{Chen2020jan,
    • author = {Chen, Siheng and Duan, Chaojing and Yang, Yaoqing and Feng, Chen and Li, Duanshun and Tian, Dong},
    • title = {Deep Unsupervised Learning of 3D Point Clouds via Graph Topology Inference and Filtering},
    • journal = {IEEE Transactions on Image Processing},
    • year = 2020,
    • pages = {3183--3198},
    • month = jan,
    • doi = {10.1109/TIP.2019.2957935},
    • url = {https://www.merl.com/publications/TR2020-004}
    • }
  •  Xu, H., Sun, H., Nikovski, D.N., Kitamura, S., Mori, K., Hashimoto, H., "Deep Reinforcement Learning for Joint Bidding and Pricing of Load Serving Entity", IEEE Transactions on Smart Grid, DOI: 10.1109/​TSG.2019.2903756, Vol. 10, No. 6, pp. 6366-6375, January 2020.
    BibTeX TR2020-003 PDF
    • @article{Xu2020jan,
    • author = {Xu, Hanchen and Sun, Hongbo and Nikovski, Daniel N. and Kitamura, Shoichi and Mori, Kazuyuki and Hashimoto, Hiroyuki},
    • title = {Deep Reinforcement Learning for Joint Bidding and Pricing of Load Serving Entity},
    • journal = {IEEE Transactions on Smart Grid},
    • year = 2020,
    • volume = 10,
    • number = 6,
    • pages = {6366--6375},
    • month = jan,
    • doi = {10.1109/TSG.2019.2903756},
    • issn = {1949-3061},
    • url = {https://www.merl.com/publications/TR2020-003}
    • }
  •  Berntorp, K., Quirynen, R., Uno, T., Di Cairano, S., "Trajectory Tracking for Autonomous Vehicles on Varying Road Surfaces by Friction-Adaptive Nonlinear Model Predictive Control", Vehicle System Dynamics, DOI: 10.1080/​00423114.2019.1697456, January 2020.
    BibTeX TR2020-005 PDF
    • @article{Berntorp2020jan,
    • author = {Berntorp, Karl and Quirynen, Rien and Uno, Tomoki and Di Cairano, Stefano},
    • title = {Trajectory Tracking for Autonomous Vehicles on Varying Road Surfaces by Friction-Adaptive Nonlinear Model Predictive Control},
    • journal = {Vehicle System Dynamics},
    • year = 2020,
    • month = jan,
    • doi = {10.1080/00423114.2019.1697456},
    • url = {https://www.merl.com/publications/TR2020-005}
    • }
  •  Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2019, pp. 237-244.
    BibTeX TR2019-157 PDF
    • @inproceedings{Chang2019dec,
    • author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2019,
    • pages = {237--244},
    • month = dec,
    • isbn = {978-1-7281-0305-1},
    • url = {https://www.merl.com/publications/TR2019-157}
    • }
  •  Karita, S., Chen, N., Hayashi, T., Hori, T., Inaguma, H., Jiang, Z., Someki, M., Yalta Soplin, N.E., Yamamoto, R., Wang, X., Watanabe, S., Yoshimura, T., Zhang, W., "A Comparative Study on Transformer Vs RNN in Speech Applications", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/​ASRU46091.2019.9003750, December 2019, pp. 449-456.
    BibTeX TR2019-158 PDF
    • @inproceedings{Karita2019dec,
    • author = {Karita, Shigeki and Chen, Nanxin and Hayashi, Tomoki and Hori, Takaaki and Inaguma, Hirofumi and Jiang, Ziyan and Someki, Masao and Yalta Soplin, Nelson Enrique and Yamamoto, Ryuichi and Wang, Xiaofei and Watanabe, Shinji and Yoshimura, Takenori and Zhang, Wangyou},
    • title = {A Comparative Study on Transformer Vs RNN in Speech Applications},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2019,
    • pages = {449--456},
    • month = dec,
    • doi = {10.1109/ASRU46091.2019.9003750},
    • url = {https://www.merl.com/publications/TR2019-158}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Streaming End-to-End Speech Recognition with Joint CTC-Attention Based Models", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2019, pp. 936-943.
    BibTeX TR2019-159 PDF
    • @inproceedings{Moritz2019dec,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Streaming End-to-End Speech Recognition with Joint CTC-Attention Based Models},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2019,
    • pages = {936--943},
    • month = dec,
    • isbn = {978-1-7281-0305-1},
    • url = {https://www.merl.com/publications/TR2019-159}
    • }
  •  Jha, D.K., Kolaric, P., Romeres, D., Raghunathan, A., Benosman, M., Nikovski, D.N., "Robust Optimization for Trajectory-Centric Model-based Reinforcement Learning", NeurIPS Workshop on Safety and Robustness in Decision Making, December 2019.
    BibTeX TR2019-156 PDF
    • @inproceedings{Jha2019dec2,
    • author = {Jha, Devesh K. and Kolaric, Patrik and Romeres, Diego and Raghunathan, Arvind and Benosman, Mouhacine and Nikovski, Daniel N.},
    • title = {Robust Optimization for Trajectory-Centric Model-based Reinforcement Learning},
    • booktitle = {NeurIPS Workshop on Safety and Robustness in Decision Making},
    • year = 2019,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2019-156}
    • }