- Moritz, N., Wichern, G., Hori, T., Le Roux, J., "All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection", Interspeech, DOI: 10.21437/Interspeech.2020-2757, October 2020, pp. 3112-3116.
BibTeX TR2020-138 PDF Presentation- @inproceedings{Moritz2020oct,
- author = {Moritz, Niko and Wichern, Gordon and Hori, Takaaki and Le Roux, Jonathan},
- title = {All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection},
- booktitle = {Interspeech},
- year = 2020,
- pages = {3112--3116},
- month = oct,
- doi = {10.21437/Interspeech.2020-2757},
- issn = {1990-9772},
- url = {https://www.merl.com/publications/TR2020-138}
- }
- Manilow, E., Wichern, G., Le Roux, J., "Hierarchical Musical Instrument Separation", International Society for Music Information Retrieval (ISMIR) Conference, October 2020, pp. 376-383.
BibTeX TR2020-136 PDF Software- @inproceedings{Manilow2020oct,
- author = {Manilow, Ethan and Wichern, Gordon and Le Roux, Jonathan},
- title = {Hierarchical Musical Instrument Separation},
- booktitle = {International Society for Music Information Retrieval (ISMIR) Conference},
- year = 2020,
- pages = {376--383},
- month = oct,
- isbn = {978-0-9813537-0-8},
- url = {https://www.merl.com/publications/TR2020-136}
- }
- Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D.K., Parsons, K., Qi, M., "Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices", Laser & Photonics Reviews, DOI: 10.1002/lpor.202000287, Vol. 14, pp. 2000287, October 2020.
BibTeX TR2020-135 PDF- @article{Tang2020oct,
- author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh K. and Parsons, Kieran and Qi, Minghao},
- title = {Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices},
- journal = {Laser \& Photonics Reviews},
- year = 2020,
- volume = 14,
- pages = 2000287,
- month = oct,
- doi = {10.1002/lpor.202000287},
- url = {https://www.merl.com/publications/TR2020-135}
- }
- Seetharaman, P., Wichern, G., Pardo, B., Le Roux, J., "Autoclip: Adaptive Gradient Clipping For Source Separation Networks", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/MLSP49062.2020.9231926, September 2020.
BibTeX TR2020-132 PDF- @inproceedings{Seetharaman2020sep,
- author = {Seetharaman, Prem and Wichern, Gordon and Pardo, Bryan and Le Roux, Jonathan},
- title = {Autoclip: Adaptive Gradient Clipping For Source Separation Networks},
- booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
- year = 2020,
- month = sep,
- publisher = {IEEE},
- doi = {10.1109/MLSP49062.2020.9231926},
- url = {https://www.merl.com/publications/TR2020-132}
- }
- Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D.K., Parsons, K., TaherSima, M., Sang, F., Klamkin, J., Qi, M., "Inverse Design of Nanophotonic Devices using Deep Neural Networks", Asia Communications and Photonics Conference (ACP), September 2020, pp. Su1A.1.
BibTeX TR2020-130 PDF Video- @inproceedings{Kojima2020sep,
- author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh K. and Parsons, Kieran and TaherSima, Mohammad and Sang, Fengqiao and Klamkin, Jonathan and Qi, Minghao},
- title = {Inverse Design of Nanophotonic Devices using Deep Neural Networks},
- booktitle = {Asia Communications and Photonics Conference (ACP)},
- year = 2020,
- pages = {Su1A.1},
- month = sep,
- publisher = {Optical Society of America},
- isbn = {978-1-943580-82-8},
- url = {https://www.merl.com/publications/TR2020-130}
- }
- Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Autoencoder for Subject-Invariant Physiological Feature Extraction", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2020.3020215, Vol. 27, pp. 1565-1569, September 2020.
BibTeX TR2020-128 PDF- @article{Han2020sep,
- author = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
- title = {Disentangled Adversarial Autoencoder for Subject-Invariant Physiological Feature Extraction},
- journal = {IEEE Signal Processing Letters},
- year = 2020,
- volume = 27,
- pages = {1565--1569},
- month = sep,
- doi = {10.1109/LSP.2020.3020215},
- issn = {1558-2361},
- url = {https://www.merl.com/publications/TR2020-128}
- }
- Pishdadian, F., Wichern, G., Le Roux, J., "Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2020.3013105, Vol. 28, pp. 2386-2399, September 2020.
BibTeX TR2020-126 PDF- @article{Pishdadian2020sep,
- author = {Pishdadian, Fatemeh and Wichern, Gordon and Le Roux, Jonathan},
- title = {Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2020,
- volume = 28,
- pages = {2386--2399},
- month = sep,
- doi = {10.1109/TASLP.2020.3013105},
- url = {https://www.merl.com/publications/TR2020-126}
- }
- Cherian, A., Chatterjee, M., Ahuja, N., "Sound2Sight: Generating Visual Dynamics from Sound and Context", European Conference on Computer Vision (ECCV), Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M., Eds., August 2020.
BibTeX TR2020-121 PDF Software- @inproceedings{Cherian2020aug,
- author = {Cherian, Anoop and Chatterjee, Moitreya and Ahuja, Narendra},
- title = {{Sound2Sight}: Generating Visual Dynamics from Sound and Context},
- booktitle = {European Conference on Computer Vision (ECCV)},
- year = 2020,
- editor = {Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M.},
- month = aug,
- publisher = {Springer},
- url = {https://www.merl.com/publications/TR2020-121}
- }
- Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Transfer Learning for Physiological Biosignals", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/EMBC44109.2020.9175233, July 2020.
BibTeX TR2020-109 PDF Video Presentation- @inproceedings{Han2020jul,
- author = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
- title = {Disentangled Adversarial Transfer Learning for Physiological Biosignals},
- booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
- year = 2020,
- month = jul,
- publisher = {IEEE},
- doi = {10.1109/EMBC44109.2020.9175233},
- issn = {1558-4615},
- isbn = {978-1-7281-1990-8},
- url = {https://www.merl.com/publications/TR2020-109}
- }
- Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles", ICML 2020 Workshop on Self-supervision in Audio and Speech, July 2020.
BibTeX TR2020-111 PDF- @inproceedings{Seetharaman2020jul,
- author = {Seetharaman, Prem and Wichern, Gordon and Le Roux, Jonathan and Pardo, Bryan},
- title = {Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles},
- booktitle = {ICML 2020 Workshop on Self-supervision in Audio and Speech},
- year = 2020,
- month = jul,
- url = {https://www.merl.com/publications/TR2020-111}
- }
- Cherian, A., Aeron, S., "Representation Learning via Adversarially-Contrastive Optimal Transport", International Conference on Machine Learning (ICML), Daumé, H. and Singh, A., Eds., July 2020, pp. 10675-10685.
BibTeX TR2020-093 PDF Software- @inproceedings{Cherian2020jul,
- author = {Cherian, Anoop and Aeron, Shuchin},
- title = {Representation Learning via Adversarially-Contrastive Optimal Transport},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2020,
- editor = {Daum{\'e}, H. and Singh, A.},
- pages = {10675--10685},
- month = jul,
- url = {https://www.merl.com/publications/TR2020-093}
- }
- Koike-Akino, T., Wang, Y., "Stochastic Bottleneck: Rateless Auto-Encoder for Flexible Dimensionality Reduction", IEEE International Symposium on Information Theory (ISIT), DOI: 10.1109/ISIT44484.2020.9174523, June 2020.
BibTeX TR2020-075 PDF Video Presentation- @inproceedings{Koike-Akino2020jun,
- author = {Koike-Akino, Toshiaki and Wang, Ye},
- title = {Stochastic Bottleneck: Rateless Auto-Encoder for Flexible Dimensionality Reduction},
- booktitle = {IEEE International Symposium on Information Theory (ISIT)},
- year = 2020,
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/ISIT44484.2020.9174523},
- issn = {2157-8117},
- isbn = {978-1-7281-6432-8},
- url = {https://www.merl.com/publications/TR2020-075}
- }
- Hu, Y., Chen, S., Zhang, Y., Gu, X., "Collaborative Motion Prediction via Neural Motion Message Passing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00635, June 2020, pp. 6318-6327.
BibTeX TR2020-072 PDF- @inproceedings{Hu2020jun,
- author = {Hu, Yue and Chen, Siheng and Zhang, Ya and Gu, Xiao},
- title = {Collaborative Motion Prediction via Neural Motion Message Passing},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2020,
- pages = {6318--6327},
- month = jun,
- doi = {10.1109/CVPR42600.2020.00635},
- url = {https://www.merl.com/publications/TR2020-072}
- }
- Li, M., Chen, S., Zhao, Y., Zhang, Y., Wang, Y., Tian, Q., "Dynamic Multiscale Graph Neural Networks for 3D Skeleton-Based Human Motion Prediction", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00029, June 2020, pp. 211-220.
BibTeX TR2020-073 PDF- @inproceedings{Li2020jun,
- author = {Li, Maosen and Chen, Siheng and Zhao, Yangheng and Zhang, Ya and Wang, Yanfeng and Tian, Qi},
- title = {Dynamic Multiscale Graph Neural Networks for {3D} Skeleton-Based Human Motion Prediction},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2020,
- pages = {211--220},
- month = jun,
- doi = {10.1109/CVPR42600.2020.00029},
- url = {https://www.merl.com/publications/TR2020-073}
- }
- Wang, Y., Koike-Akino, T., "Learning to Modulate for Non-coherent MIMO", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC40277.2020.9149438, June 2020.
BibTeX TR2020-071 PDF Video Presentation- @inproceedings{Wang2020jun,
- author = {Wang, Ye and Koike-Akino, Toshiaki},
- title = {Learning to Modulate for Non-coherent {MIMO}},
- booktitle = {IEEE International Conference on Communications (ICC)},
- year = 2020,
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/ICC40277.2020.9149438},
- issn = {1938-1883},
- isbn = {978-1-7281-5089-5},
- url = {https://www.merl.com/publications/TR2020-071}
- }
- Kumar, A., Marks, T.K., Mou, W., Wang, Y., Cherian, A., Jones, M.J., Liu, X., Koike-Akino, T., Feng, C., "LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00826, June 2020.
BibTeX TR2020-067 PDF Video Data Software- @inproceedings{Kumar2020jun,
- author = {Kumar, Abhinav and Marks, Tim K. and Mou, Wenxuan and Wang, Ye and Cherian, Anoop and Jones, Michael J. and Liu, Xiaoming and Koike-Akino, Toshiaki and Feng, Chen},
- title = {{LUVLi} Face Alignment: Estimating Landmarks' Location, Uncertainty, and Visibility Likelihood},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2020,
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/CVPR42600.2020.00826},
- issn = {2575-7075},
- isbn = {978-1-7281-7168-5},
- url = {https://www.merl.com/publications/TR2020-067}
- }
- Wu, P., Chen, S., "MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.01140, June 2020, pp. 11382-11392.
BibTeX TR2020-068 PDF Data Software- @inproceedings{Wu2020jun,
- author = {Wu, Pengxiang and Chen, Siheng},
- title = {{MotionNet}: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird's Eye View Maps},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2020,
- pages = {11382--11392},
- month = jun,
- doi = {10.1109/CVPR42600.2020.01140},
- url = {https://www.merl.com/publications/TR2020-068}
- }
- Chen, S., Liu, B., Feng, C., Vallespi-Gonzalez, C., Wellington, C., "3D Point Cloud Processing and Learning for Autonomous Driving", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2020.2984780, Vol. 38, No. 1, pp. 68-86, May 2020.
BibTeX TR2020-066 PDF- @article{Chen2020may2,
- author = {Chen, Siheng and Liu, Baoan and Feng, Chen and Vallespi-Gonzalez, Carlos and Wellington, Carl},
- title = {{3D} Point Cloud Processing and Learning for Autonomous Driving},
- journal = {IEEE Signal Processing Magazine},
- year = 2020,
- volume = 38,
- number = 1,
- pages = {68--86},
- month = may,
- doi = {10.1109/MSP.2020.2984780},
- url = {https://www.merl.com/publications/TR2020-066}
- }
- Fujihashi, T., Koike-Akino, T., Watanabe, T., Orlik, P.V., "High-Quality Soft Image Delivery with Deep Image Denoising", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC40277.2020.9148611, May 2020.
BibTeX TR2020-060 PDF Video- @inproceedings{Fujihashi2020may,
- author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi and Orlik, Philip V.},
- title = {High-Quality Soft Image Delivery with Deep Image Denoising},
- booktitle = {IEEE International Conference on Communications (ICC)},
- year = 2020,
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICC40277.2020.9148611},
- issn = {1938-1883},
- isbn = {978-1-7281-5089-5},
- url = {https://www.merl.com/publications/TR2020-060}
- }
- Bhamidipati, S., Kim, K.J., Sun, H., Orlik, P.V., "Artificial Intelligence-Based Distributed Belief Propagation and Recurrent Neural Network Algorithm for Wide-Area Monitoring Systems", IEEE Network, DOI: 10.1109/MNET.011.1900322, Vol. 34, No. 3, pp. 64-72, May 2020.
BibTeX TR2020-058 PDF- @article{Bhamidipati2020may,
- author = {Bhamidipati, Sriramya and Kim, Kyeong Jin and Sun, Hongbo and Orlik, Philip V.},
- title = {Artificial Intelligence-Based Distributed Belief Propagation and Recurrent Neural Network Algorithm for Wide-Area Monitoring Systems},
- journal = {IEEE Network},
- year = 2020,
- volume = 34,
- number = 3,
- pages = {64--72},
- month = may,
- doi = {10.1109/MNET.011.1900322},
- url = {https://www.merl.com/publications/TR2020-058}
- }
- Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Learning Invariant Representations from EEG via Adversarial Inference", IEEE Access, DOI: 10.1109/ACCESS.2020.2971600, Vol. 8, pp. 27074-27085, April 2020.
BibTeX TR2020-049 PDF- @article{Ozdenizci2020apr,
- author = {Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
- title = {Learning Invariant Representations from {EEG} via Adversarial Inference},
- journal = {IEEE Access},
- year = 2020,
- volume = 8,
- pages = {27074--27085},
- month = apr,
- doi = {10.1109/ACCESS.2020.2971600},
- issn = {2169-3536},
- url = {https://www.merl.com/publications/TR2020-049}
- }
- Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "End-To-End Multi-Speaker Speech Recognition with Transformer", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054029, April 2020, pp. 6134-6138.
BibTeX TR2020-043 PDF Video Presentation- @inproceedings{Chang2020apr,
- author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and Le Roux, Jonathan and Watanabe, Shinji},
- title = {End-To-End Multi-Speaker Speech Recognition with Transformer},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {6134--6138},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9054029},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-043}
- }
- Pishdadian, F., Wichern, G., Le Roux, J., "Learning to Separate Sounds From Weakly Labeled Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053055, April 2020, pp. 91-95.
BibTeX TR2020-038 PDF Video Presentation- @inproceedings{Pishdadian2020apr,
- author = {Pishdadian, Fatemeh and Wichern, Gordon and Le Roux, Jonathan},
- title = {Learning to Separate Sounds From Weakly Labeled Scenes},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {91--95},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053055},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-038}
- }
- Al-Shabili, A., Mansour, H., Boufounos, P.T., "Learning Plug-and-Play Proximal Quasi-Newton Denoisers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054537, April 2020, pp. 8896-8900.
BibTeX TR2020-045 PDF Video- @inproceedings{Al-Shabili2020apr,
- author = {Al-Shabili, Abdullah and Mansour, Hassan and Boufounos, Petros T.},
- title = {Learning Plug-and-Play Proximal Quasi-Newton Denoisers},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {8896--8900},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9054537},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-045}
- }
- Maciejewski, M., Wichern, G., McQuinn, E., Le Roux, J., "WHAMR!: Noisy and Reverberant Single-Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053327, April 2020, pp. 696-700.
BibTeX TR2020-042 PDF Video Presentation- @inproceedings{Maciejewski2020apr,
- author = {Maciejewski, Matthew and Wichern, Gordon and McQuinn, Emmett and Le Roux, Jonathan},
- title = {{WHAMR!}: Noisy and Reverberant Single-Channel Speech Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {696--700},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053327},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-042}
- }