Publications

596 / 3,602 publications found.


  •  Geng, S., Gao, P., Chatterjee, M., Hori, C., Le Roux, J., Zhang, Y., Li, H., Cherian, A., "Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers", AAAI Conference on Artificial Intelligence, February 2021, pp. 1415-1423.
    BibTeX TR2021-010 PDF
    • @inproceedings{Geng2021feb,
    • author = {Geng, Shijie and Gao, Peng and Chatterjee, Moitreya and Hori, Chiori and Le Roux, Jonathan and Zhang, Yongfeng and Li, Hongsheng and Cherian, Anoop},
    • title = {Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2021,
    • pages = {1415--1423},
    • month = feb,
    • publisher = {AAAI Press},
    • address = {Palo Alto, California, USA},
    • isbn = {978-1-57735-866-4},
    • url = {https://www.merl.com/publications/TR2021-010}
    • }
  •  Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Wang, Y., Parsons, K., "Deep Neural Networks for Inverse Design of Nanophotonic Devices", IEEE Journal of Lightwave Technology, DOI: 10.1109/JLT.2021.3050083, January 2021.
    BibTeX TR2021-001 PDF
    • @article{Kojima2021jan,
    • author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Wang, Ye and Parsons, Kieran},
    • title = {Deep Neural Networks for Inverse Design of Nanophotonic Devices},
    • journal = {IEEE Journal of Lightwave Technology},
    • year = 2021,
    • month = jan,
    • doi = {10.1109/JLT.2021.3050083},
    • issn = {1558-2213},
    • url = {https://www.merl.com/publications/TR2021-001}
    • }
  •  Lohit, S., Anirudh, R., Turaga, P., "Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
    BibTeX TR2021-004 PDF
    • @inproceedings{Lohit2021jan,
    • author = {Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
    • title = {Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2021,
    • month = jan,
    • publisher = {CVF OpenAccess},
    • url = {https://www.merl.com/publications/TR2021-004}
    • }
  •  Anirudh, R., Lohit, S., Turaga, P., "Generative Patch Priors for Practical Compressive Image Recovery", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
    BibTeX TR2021-003 PDF
    • @inproceedings{Anirudh2021jan,
    • author = {Anirudh, Rushil and Lohit, Suhas and Turaga, Pavan},
    • title = {Generative Patch Priors for Practical Compressive Image Recovery},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2021,
    • month = jan,
    • publisher = {CVF OpenAccess},
    • url = {https://www.merl.com/publications/TR2021-003}
    • }
  •  Nowara, E., Marks, T.K., Mansour, H., Veeraraghavan, A., "Near-Infrared Imaging Photoplethysmography During Driving", IEEE Transactions on Intelligent Transportation Systems, DOI: 10.1109/TITS.2020.3038317, pp. 1-12, December 2020.
    BibTeX TR2020-161 PDF
    • @article{Nowara2020dec,
    • author = {Nowara, Ewa and Marks, Tim K. and Mansour, Hassan and Veeraraghavan, Ashok},
    • title = {Near-Infrared Imaging Photoplethysmography During Driving},
    • journal = {IEEE Transactions on Intelligent Transportation Systems},
    • year = 2020,
    • pages = {1--12},
    • month = dec,
    • doi = {10.1109/TITS.2020.3038317},
    • url = {https://www.merl.com/publications/TR2020-161}
    • }
  •  Li, M., Chen, S., Zhang, Y., "Graph Cross Networks with Vertex Infomax Pooling", Advances in Neural Information Processing Systems (NeurIPS), December 2020.
    BibTeX TR2020-167 PDF
    • @inproceedings{Li2020dec,
    • author = {Li, Maosen and Chen, Siheng and Zhang, Ya},
    • title = {Graph Cross Networks with Vertex Infomax Pooling},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2020,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2020-167}
    • }
  •  Talreja, V., Koike-Akino, T., Wang, Y., Millar, D.S., Kojima, K., Parsons, K., "End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping", European Conference on Optical Communication (ECOC), DOI: 10.1109/ECOC48923.2020.9333382, November 2020.
    BibTeX TR2020-155 PDF Video
    • @inproceedings{Talreja2020nov,
    • author = {Talreja, Veeru and Koike-Akino, Toshiaki and Wang, Ye and Millar, David S. and Kojima, Keisuke and Parsons, Kieran},
    • title = {End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping},
    • booktitle = {European Conference on Optical Communication (ECOC)},
    • year = 2020,
    • month = nov,
    • publisher = {IEEE},
    • doi = {10.1109/ECOC48923.2020.9333382},
    • isbn = {978-1-7281-7361-0},
    • url = {https://www.merl.com/publications/TR2020-155}
    • }
  •  Corcodel, R., Jain, S., van Baar, J., "Interactive Tactile Perception for Classification of Novel Object Instances", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS45743.2020.9341795, November 2020, pp. 9861-9868.
    BibTeX TR2020-143 PDF Video
    • @inproceedings{Corcodel2020nov,
    • author = {Corcodel, Radu and Jain, Siddarth and van Baar, Jeroen},
    • title = {Interactive Tactile Perception for Classification of Novel Object Instances},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2020,
    • pages = {9861--9868},
    • month = nov,
    • publisher = {IEEE},
    • doi = {10.1109/IROS45743.2020.9341795},
    • url = {https://www.merl.com/publications/TR2020-143}
    • }
  •  Jones, M.J., Ramachandra, B., Vatsavai, R., "A Survey of Single-Scene Video Anomaly Detection", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2020.3040591, Vol. 44, No. 5, pp. 2293-2312, November 2020.
    BibTeX TR2021-029 PDF
    • @article{Jones2020nov,
    • author = {Jones, Michael J. and Ramachandra, Bharathkumar and Vatsavai, Ranga},
    • title = {A Survey of Single-Scene Video Anomaly Detection},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2020,
    • volume = 44,
    • number = 5,
    • pages = {2293--2312},
    • month = nov,
    • doi = {10.1109/TPAMI.2020.3040591},
    • url = {https://www.merl.com/publications/TR2021-029}
    • }
  •  Ota, K., Sasaki, Y., Jha, D., Yoshiyasu, Y., Kanezaki, A., "Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), November 2020.
    BibTeX TR2020-141 PDF Software
    • @inproceedings{Ota2020nov,
    • author = {Ota, Kei and Sasaki, Yoko and Jha, Devesh and Yoshiyasu, Yusuke and Kanezaki, Asako},
    • title = {Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2020,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2020-141}
    • }
  •  Hori, T., Moritz, N., Hori, C., Le Roux, J., "Transformer-based Long-context End-to-end Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2020-2928, October 2020, pp. 5011-5015.
    BibTeX TR2020-139 PDF Presentation
    • @inproceedings{Hori2020oct,
    • author = {Hori, Takaaki and Moritz, Niko and Hori, Chiori and Le Roux, Jonathan},
    • title = {Transformer-based Long-context End-to-end Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2020,
    • pages = {5011--5015},
    • month = oct,
    • doi = {10.21437/Interspeech.2020-2928},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2020-139}
    • }
  •  Jayashankar, T., Le Roux, J., Moulin, P., "Detecting Audio Attacks on ASR Systems with Dropout Uncertainty", Interspeech, DOI: 10.21437/Interspeech.2020-1846, October 2020, pp. 4671-4675.
    BibTeX TR2020-137 PDF Presentation
    • @inproceedings{Jayashankar2020oct,
    • author = {Jayashankar, Tejas and Le Roux, Jonathan and Moulin, Pierre},
    • title = {Detecting Audio Attacks on ASR Systems with Dropout Uncertainty},
    • booktitle = {Interspeech},
    • year = 2020,
    • pages = {4671--4675},
    • month = oct,
    • doi = {10.21437/Interspeech.2020-1846},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2020-137}
    • }
  •  Moritz, N., Wichern, G., Hori, T., Le Roux, J., "All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection", Interspeech, DOI: 10.21437/Interspeech.2020-2757, October 2020, pp. 3112-3116.
    BibTeX TR2020-138 PDF Presentation
    • @inproceedings{Moritz2020oct,
    • author = {Moritz, Niko and Wichern, Gordon and Hori, Takaaki and Le Roux, Jonathan},
    • title = {All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection},
    • booktitle = {Interspeech},
    • year = 2020,
    • pages = {3112--3116},
    • month = oct,
    • doi = {10.21437/Interspeech.2020-2757},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2020-138}
    • }
  •  Manilow, E., Wichern, G., Le Roux, J., "Hierarchical Musical Instrument Separation", International Society for Music Information Retrieval (ISMIR) Conference, October 2020, pp. 376-383.
    BibTeX TR2020-136 PDF Software
    • @inproceedings{Manilow2020oct,
    • author = {Manilow, Ethan and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Hierarchical Musical Instrument Separation},
    • booktitle = {International Society for Music Information Retrieval (ISMIR) Conference},
    • year = 2020,
    • pages = {376--383},
    • month = oct,
    • isbn = {978-0-9813537-0-8},
    • url = {https://www.merl.com/publications/TR2020-136}
    • }
  •  Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D.K., Parsons, K., Qi, M., "Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices", Laser & Photonics Reviews, DOI: 10.1002/lpor.202000287, Vol. 14, pp. 2000287, October 2020.
    BibTeX TR2020-135 PDF
    • @article{Tang2020oct,
    • author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh K. and Parsons, Kieran and Qi, Minghao},
    • title = {Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices},
    • journal = {Laser \& Photonics Reviews},
    • year = 2020,
    • volume = 14,
    • pages = {2000287},
    • month = oct,
    • doi = {10.1002/lpor.202000287},
    • url = {https://www.merl.com/publications/TR2020-135}
    • }
  •  Seetharaman, P., Wichern, G., Pardo, B., Le Roux, J., "Autoclip: Adaptive Gradient Clipping For Source Separation Networks", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/MLSP49062.2020.9231926, September 2020.
    BibTeX TR2020-132 PDF
    • @inproceedings{Seetharaman2020sep,
    • author = {Seetharaman, Prem and Wichern, Gordon and Pardo, Bryan and Le Roux, Jonathan},
    • title = {Autoclip: Adaptive Gradient Clipping For Source Separation Networks},
    • booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
    • year = 2020,
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/MLSP49062.2020.9231926},
    • url = {https://www.merl.com/publications/TR2020-132}
    • }
  •  Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D.K., Parsons, K., TaherSima, M., Sang, F., Klamkin, J., Qi, M., "Inverse Design of Nanophotonic Devices using Deep Neural Networks", Asia Communications and Photonics Conference (ACP), September 2020, pp. Su1A.1.
    BibTeX TR2020-130 PDF Video
    • @inproceedings{Kojima2020sep,
    • author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh K. and Parsons, Kieran and TaherSima, Mohammad and Sang, Fengqiao and Klamkin, Jonathan and Qi, Minghao},
    • title = {Inverse Design of Nanophotonic Devices using Deep Neural Networks},
    • booktitle = {Asia Communications and Photonics Conference (ACP)},
    • year = 2020,
    • pages = {Su1A.1},
    • month = sep,
    • publisher = {Optical Society of America},
    • isbn = {978-1-943580-82-8},
    • url = {https://www.merl.com/publications/TR2020-130}
    • }
  •  Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Autoencoder for Subject-Invariant Physiological Feature Extraction", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2020.3020215, Vol. 27, pp. 1565-1569, September 2020.
    BibTeX TR2020-128 PDF
    • @article{Han2020sep,
    • author = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    • title = {Disentangled Adversarial Autoencoder for Subject-Invariant Physiological Feature Extraction},
    • journal = {IEEE Signal Processing Letters},
    • year = 2020,
    • volume = 27,
    • pages = {1565--1569},
    • month = sep,
    • doi = {10.1109/LSP.2020.3020215},
    • issn = {1558-2361},
    • url = {https://www.merl.com/publications/TR2020-128}
    • }
  •  Pishdadian, F., Wichern, G., Le Roux, J., "Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2020.3013105, Vol. 28, pp. 2386-2399, September 2020.
    BibTeX TR2020-126 PDF
    • @article{Pishdadian2020sep,
    • author = {Pishdadian, Fatemeh and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2020,
    • volume = 28,
    • pages = {2386--2399},
    • month = sep,
    • doi = {10.1109/TASLP.2020.3013105},
    • url = {https://www.merl.com/publications/TR2020-126}
    • }
  •  Cherian, A., Chatterjee, M., Ahuja, N., "Sound2Sight: Generating Visual Dynamics from Sound and Context", European Conference on Computer Vision (ECCV), Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M., Eds., August 2020.
    BibTeX TR2020-121 PDF Software
    • @inproceedings{Cherian2020aug,
    • author = {Cherian, Anoop and Chatterjee, Moitreya and Ahuja, Narendra},
    • title = {Sound2Sight: Generating Visual Dynamics from Sound and Context},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2020,
    • editor = {Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M.},
    • month = aug,
    • publisher = {Springer},
    • url = {https://www.merl.com/publications/TR2020-121}
    • }
  •  Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Transfer Learning for Physiological Biosignals", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/EMBC44109.2020.9175233, July 2020.
    BibTeX TR2020-109 PDF Video Presentation
    • @inproceedings{Han2020jul,
    • author = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    • title = {Disentangled Adversarial Transfer Learning for Physiological Biosignals},
    • booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
    • year = 2020,
    • month = jul,
    • publisher = {IEEE},
    • doi = {10.1109/EMBC44109.2020.9175233},
    • issn = {1558-4615},
    • isbn = {978-1-7281-1990-8},
    • url = {https://www.merl.com/publications/TR2020-109}
    • }
  •  Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles", ICML 2020 Workshop on Self-supervision in Audio and Speech, July 2020.
    BibTeX TR2020-111 PDF
    • @inproceedings{Seetharaman2020jul,
    • author = {Seetharaman, Prem and Wichern, Gordon and Le Roux, Jonathan and Pardo, Bryan},
    • title = {Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles},
    • booktitle = {ICML 2020 Workshop on Self-supervision in Audio and Speech},
    • year = 2020,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2020-111}
    • }
  •  Cherian, A., Aeron, S., "Representation Learning via Adversarially-Contrastive Optimal Transport", International Conference on Machine Learning (ICML), Daumé, H. and Singh, A., Eds., July 2020, pp. 10675-10685.
    BibTeX TR2020-093 PDF Software
    • @inproceedings{Cherian2020jul,
    • author = {Cherian, Anoop and Aeron, Shuchin},
    • title = {Representation Learning via Adversarially-Contrastive Optimal Transport},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2020,
    • editor = {Daum{\'e}, H. and Singh, A.},
    • pages = {10675--10685},
    • month = jul,
    • url = {https://www.merl.com/publications/TR2020-093}
    • }
  •  Koike-Akino, T., Wang, Y., "Stochastic Bottleneck: Rateless Auto-Encoder for Flexible Dimensionality Reduction", IEEE International Symposium on Information Theory (ISIT), DOI: 10.1109/ISIT44484.2020.9174523, June 2020.
    BibTeX TR2020-075 PDF Video Presentation
    • @inproceedings{Koike-Akino2020jun,
    • author = {Koike-Akino, Toshiaki and Wang, Ye},
    • title = {Stochastic Bottleneck: Rateless Auto-Encoder for Flexible Dimensionality Reduction},
    • booktitle = {IEEE International Symposium on Information Theory (ISIT)},
    • year = 2020,
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/ISIT44484.2020.9174523},
    • issn = {2157-8117},
    • isbn = {978-1-7281-6432-8},
    • url = {https://www.merl.com/publications/TR2020-075}
    • }
  •  Hu, Y., Chen, S., Zhang, Y., Gu, X., "Collaborative Motion Prediction via Neural Motion Message Passing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00635, June 2020, pp. 6318-6327.
    BibTeX TR2020-072 PDF
    • @inproceedings{Hu2020jun,
    • author = {Hu, Yue and Chen, Siheng and Zhang, Ya and Gu, Xiao},
    • title = {Collaborative Motion Prediction via Neural Motion Message Passing},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {6318--6327},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.00635},
    • url = {https://www.merl.com/publications/TR2020-072}
    • }