Publications

Wang, Y., Aeron, S., Rakin, A.S., Koike-Akino, T., Moulin, P., "Robust Machine Learning via Privacy/Rate-Distortion Theory", IEEE International Symposium on Information Theory (ISIT), DOI: 10.1109/ISIT45174.2021.9517751, July 2021.
BibTeX TR2021-082 PDF Video Presentation
- @inproceedings{Wang2021jul,
- author = {Wang, Ye and Aeron, Shuchin and Rakin, Adnan S. and Koike-Akino, Toshiaki and Moulin, Pierre},
- title = {{Robust Machine Learning via Privacy/Rate-Distortion Theory}},
- booktitle = {IEEE International Symposium on Information Theory (ISIT)},
- year = 2021,
- month = jul,
- publisher = {IEEE},
- doi = {10.1109/ISIT45174.2021.9517751},
- isbn = {978-1-5386-8210-4},
- url = {https://www.merl.com/publications/TR2021-082}
- }
Cherian, A., Wang, J., "Generalized One-Class Learning Using Pairs of Complementary Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2021.3092999, June 2021.
BibTeX TR2021-076 PDF Software
- @article{Cherian2021jun,
- author = {Cherian, Anoop and Wang, Jue},
- title = {{Generalized One-Class Learning Using Pairs of Complementary Classifiers}},
- journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
- month = jun,
- year = {2021},
- doi = {10.1109/TPAMI.2021.3092999},
- url = {https://www.merl.com/publications/TR2021-076}
- }
Hori, C., "Human Perspective Scene Understanding via Multimodal Sensing", Tech. Rep. TR2022-151, Audio-Visual Scene Understanding Tutorial at CVPR 2021, June 2021.
BibTeX TR2022-151 PDF Video
- @techreport{Hori2021jun,
- author = {Hori, Chiori},
- title = {{Human Perspective Scene Understanding via Multimodal Sensing}},
- institution = {Mitsubishi Electric Research Laboratories},
- number = {TR2022-151},
- year = 2021,
- month = jun,
- note = {Audio-Visual Scene Understanding Tutorial at CVPR 2021},
- url = {https://www.merl.com/publications/TR2022-151}
- }
Raychaudhuri, D.S., van Baar, J., Paul, S., Roy-Chowdhury, A.K., "Cross-domain Imitation from Observations", International Conference on Machine Learning (ICML), June 2021.
BibTeX TR2021-074 PDF
- @inproceedings{Raychaudhuri2021jun,
- author = {Raychaudhuri, Dripta S. and {van Baar}, Jeroen and Paul, Sujoy and Roy-Chowdhury, Amit K.},
- title = {{Cross-domain Imitation from Observations}},
- booktitle = {International Conference on Machine Learning (ICML)},
- month = jun,
- year = {2021},
- url = {https://www.merl.com/publications/TR2021-074}
- }
Moritz, N., Hori, T., Le Roux, J., "Capturing Multi-Resolution Context by Dilated Self-Attention", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9415001, June 2021, pp. 5869-5873.
BibTeX TR2021-036 PDF
- @inproceedings{Moritz2021jun,
- author = {Moritz, Niko and Hori, Takaaki and {Le Roux}, Jonathan},
- title = {{Capturing Multi-Resolution Context by Dilated Self-Attention}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages = {5869--5873},
- month = jun,
- year = {2021},
- doi = {10.1109/ICASSP39728.2021.9415001},
- url = {https://www.merl.com/publications/TR2021-036}
- }
Chen, S., Eldar, Y., "Time-Varying Graph Signal Inpainting via Unrolling Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9413406, June 2021.
BibTeX TR2021-070 PDF
- @inproceedings{Chen2021jun,
- author = {Chen, Siheng and Eldar, Yonina},
- title = {{Time-Varying Graph Signal Inpainting via Unrolling Networks}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9413406},
- url = {https://www.merl.com/publications/TR2021-070}
- }
Chen, S., Eldar, Y., "Graph Signaling Denoising via Unrolling Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9415073, June 2021.
BibTeX TR2021-071 PDF
- @inproceedings{Chen2021jun3,
- author = {Chen, Siheng and Eldar, Yonina},
- title = {{Graph Signaling Denoising via Unrolling Networks}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9415073},
- url = {https://www.merl.com/publications/TR2021-071}
- }
Hung, Y.-N., Wichern, G., Le Roux, J., "Transcription Is All You Need: Learning to Separate Musical Mixtures with Score as Supervision", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9413358, June 2021, pp. 46-50.
BibTeX TR2021-069 PDF
- @inproceedings{Hung2021jun,
- author = {Hung, Yun-Ning and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Transcription Is All You Need: Learning to Separate Musical Mixtures with Score as Supervision}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages = {46--50},
- month = jun,
- year = {2021},
- doi = {10.1109/ICASSP39728.2021.9413358},
- issn = {2379-190X},
- isbn = {978-1-7281-7605-5},
- url = {https://www.merl.com/publications/TR2021-069}
- }
Khurana, S., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9414299, June 2021, pp. 6553-6557.
BibTeX TR2021-039 PDF
- @inproceedings{Khurana2021jun,
- author = {Khurana, Sameer and Moritz, Niko and Hori, Takaaki and {Le Roux}, Jonathan},
- title = {{Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages = {6553--6557},
- month = jun,
- year = {2021},
- doi = {10.1109/ICASSP39728.2021.9414299},
- url = {https://www.merl.com/publications/TR2021-039}
- }
Moritz, N., Hori, T., Le Roux, J., "Semi-Supervised Speech Recognition via Graph-Based Temporal Classification", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9414058, June 2021, pp. 6548-6552.
BibTeX TR2021-037 PDF
- @inproceedings{Moritz2021jun2,
- author = {Moritz, Niko and Hori, Takaaki and {Le Roux}, Jonathan},
- title = {{Semi-Supervised Speech Recognition via Graph-Based Temporal Classification}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages = {6548--6552},
- month = jun,
- year = {2021},
- doi = {10.1109/ICASSP39728.2021.9414058},
- url = {https://www.merl.com/publications/TR2021-037}
- }
Watanabe, S., Boyer, F., Chang, X., Guo, P., Hayashi, T., Higuchi, Y., Hori, T., Huang, W.-C., Inaguma, H., Kamo, N., Karita, S., Li, C., Shi, J., Subramanian, A.S., Zhang, W., "The 2020 ESPNET Update: New Features, Broadened Applications, Performance Improvements, and Future Plans", IEEE Data Science and Learning Workshop (DSLW), DOI: 10.1109/DSLW51110, June 2021, pp. 1-6.
BibTeX TR2021-073 PDF
- @inproceedings{Watanabe2021jun,
- author = {Watanabe, Shinji and Boyer, Florian and Chang, Xuankai and Guo, Pengcheng and Hayashi, Tomoki and Higuchi, Yosuke and Hori, Takaaki and Huang, Wen-Chin and Inaguma, Hirofumi and Kamo, Naoyuki and Karita, Shigeki and Li, Chenda and Shi, Jing and Subramanian, Aswin S. and Zhang, Wangyou},
- title = {{The 2020 ESPNET Update: New Features, Broadened Applications, Performance Improvements, and Future Plans}},
- booktitle = {IEEE Data Science and Learning Workshop (DSLW)},
- year = 2021,
- pages = {1--6},
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/DSLW51110},
- isbn = {978-1-6654-2826-2},
- url = {https://www.merl.com/publications/TR2021-073}
- }
Kim, S., Galley, M., Gunasekara, C., Lee, S., Atkinson, A., Peng, B., Schulz, H., Gao, J., Li, J., Adada, M., Huang, M., Lastras, L., Kummerfeld, J.K., Lasecki, W.S., Hori, C., Cherian, A., Marks, T.K., Rastogi, A., Zang, X., Sunkara, S., Gupta, R., "Overview of the Eighth Dialog System Technology Challenge: DSTC8", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2021.3078368, May 2021.
BibTeX TR2021-064 PDF
- @article{Kim2021may,
- author = {Kim, Seokhwan and Galley, Michel and Gunasekara, Chulaka and Lee, Sungjin and Atkinson, Adam and Peng, Baolin and Schulz, Hannes and Gao, Jianfeng and Li, Jinchao and Adada, Mahmoud and Huang, Minlie and Lastras, Luis and Kummerfeld, Jonathan K. and Lasecki, Walter S. and Hori, Chiori and Cherian, Anoop and Marks, Tim K. and Rastogi, Abhinav and Zang, Xiaoxue and Sunkara, Srinivas and Gupta, Raghav},
- title = {{Overview of the Eighth Dialog System Technology Challenge: DSTC8}},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- month = may,
- year = {2021},
- doi = {10.1109/TASLP.2021.3078368},
- issn = {2329-9290},
- url = {https://www.merl.com/publications/TR2021-064}
- }
Hori, C., Tsuchiya, M., Chen, S., Cherian, A., Hori, T., Harsham, B.A., Marks, T.K., Le Roux, J., Sullivan, A., Vetro, A., "マルチモーダルセンシング情報に基づくScene-aware Interaction 技術", Society of Automotive Engineers of Japan, Vol. 75, No. 5, pp. 66-71, May 2021.
BibTeX TR2021-042 PDF Video
- @article{Hori2021may,
- author = {Hori, Chiori and Tsuchiya, Masato and Chen, Siheng and Cherian, Anoop and Hori, Takaaki and Harsham, Bret A. and Marks, Tim K. and {Le Roux}, Jonathan and Sullivan, Alan and Vetro, Anthony},
- title = {{マルチモーダルセンシング情報に基づくScene-aware Interaction 技術}},
- journal = {Society of Automotive Engineers of Japan},
- volume = {75},
- number = {5},
- pages = {66--71},
- month = may,
- year = {2021},
- url = {https://www.merl.com/publications/TR2021-042}
- }
Pan, C., Chen, S., Ortega, A., "Spatio-Temporal Graph Scattering Transform", International Conference on Learning Representations (ICLR), May 2021.
BibTeX TR2021-044 PDF
- @inproceedings{Pan2021may,
- author = {Pan, Chao and Chen, Siheng and Ortega, Antonio},
- title = {{Spatio-Temporal Graph Scattering Transform}},
- booktitle = {International Conference on Learning Representations (ICLR)},
- year = 2021,
- month = may,
- url = {https://www.merl.com/publications/TR2021-044}
- }
Han, M., Ozdenizci, O., Koike-Akino, T., Wang, Y., Erdogmus, D., "Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders", IEEE Journal of Biomedical and Health Informatics, DOI: 10.1109/JBHI.2021.3062335, Vol. 25, No. 8, pp. 2928-2937, April 2021.
BibTeX TR2021-027 PDF
- @article{Han2021apr,
- author = {Han, Mo and Ozdenizci, Ozan and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
- title = {{Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders}},
- journal = {IEEE Journal of Biomedical and Health Informatics},
- volume = {25},
- number = {8},
- pages = {2928--2937},
- month = apr,
- year = {2021},
- doi = {10.1109/JBHI.2021.3062335},
- issn = {2168-2208},
- url = {https://www.merl.com/publications/TR2021-027}
- }
Ramachandra, B., Jones, M.J., Vatsavai, R., "Perceptual Metric Learning for Video Anomaly Detection", Machine Vision and Applications, DOI: 10.1007/s00138-021-01187-5, Vol. 32, No. 63, pp. 1-18, March 2021.
BibTeX TR2021-028 PDF
- @article{Ramachandra2021mar,
- author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
- title = {{Perceptual Metric Learning for Video Anomaly Detection}},
- journal = {Machine Vision and Applications},
- year = 2021,
- volume = 32,
- number = 63,
- pages = {1--18},
- month = mar,
- doi = {10.1007/s00138-021-01187-5},
- url = {https://www.merl.com/publications/TR2021-028}
- }
Demir, A., Koike-Akino, T., Wang, Y., Erdogmus, D., "AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference", IEEE Access, DOI: 10.1109/ACCESS.2021.3064530, Vol. 9, pp. 39955-39972, March 2021.
BibTeX TR2021-016 PDF Presentation
- @article{Demir2021mar,
- author = {Demir, Andac and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
- title = {{AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference}},
- journal = {IEEE Access},
- volume = {9},
- pages = {39955--39972},
- month = mar,
- year = {2021},
- doi = {10.1109/ACCESS.2021.3064530},
- issn = {2169-3536},
- url = {https://www.merl.com/publications/TR2021-016}
- }
Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D.K., TaherSima, M., Parsons, K., "Application of Deep Learning for Nanophotonic Device Design", SPIE Photonics West, Bahram Jalali and Ken-ichi Kitayama, Eds., DOI: 10.1117/12.2579104, March 2021.
BibTeX TR2020-182 PDF Video
- @inproceedings{Kojima2021mar,
- author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh K. and TaherSima, Mohammad and Parsons, Kieran},
- title = {{Application of Deep Learning for Nanophotonic Device Design}},
- booktitle = {SPIE Photonics West},
- editor = {Jalali, Bahram and Kitayama, Ken-ichi},
- month = mar,
- year = {2021},
- publisher = {SPIE},
- doi = {10.1117/12.2579104},
- url = {https://www.merl.com/publications/TR2020-182}
- }
Geng, S., Gao, P., Chatterjee, M., Hori, C., Le Roux, J., Zhang, Y., Li, H., Cherian, A., "Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers", AAAI Conference on Artificial Intelligence, February 2021, pp. 1415-1423.
BibTeX TR2021-010 PDF
- @inproceedings{Geng2021feb,
- author = {Geng, Shijie and Gao, Peng and Chatterjee, Moitreya and Hori, Chiori and {Le Roux}, Jonathan and Zhang, Yongfeng and Li, Hongsheng and Cherian, Anoop},
- title = {{Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers}},
- booktitle = {AAAI Conference on Artificial Intelligence},
- year = 2021,
- pages = {1415--1423},
- month = feb,
- publisher = {AAAI Press},
- address = {Palo Alto, California, USA},
- isbn = {978-1-57735-866-4},
- url = {https://www.merl.com/publications/TR2021-010}
- }
Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Wang, Y., Parsons, K., "Deep Neural Networks for Inverse Design of Nanophotonic Devices", IEEE Journal of Lightwave Technology, DOI: 10.1109/JLT.2021.3050083, January 2021.
BibTeX TR2021-001 PDF
- @article{Kojima2021jan,
- author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Wang, Ye and Parsons, Kieran},
- title = {{Deep Neural Networks for Inverse Design of Nanophotonic Devices}},
- journal = {IEEE Journal of Lightwave Technology},
- month = jan,
- year = {2021},
- doi = {10.1109/JLT.2021.3050083},
- issn = {1558-2213},
- url = {https://www.merl.com/publications/TR2021-001}
- }
Lohit, S., Anirudh, R., Turaga, P., "Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
BibTeX TR2021-004 PDF
- @inproceedings{Lohit2021jan,
- author = {Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
- title = {{Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization}},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- month = jan,
- year = {2021},
- publisher = {CVF OpenAccess},
- url = {https://www.merl.com/publications/TR2021-004}
- }
Anirudh, R., Lohit, S., Turaga, P., "Generative Patch Priors for Practical Compressive Image Recovery", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
BibTeX TR2021-003 PDF
- @inproceedings{Anirudh2021jan,
- author = {Anirudh, Rushil and Lohit, Suhas and Turaga, Pavan},
- title = {{Generative Patch Priors for Practical Compressive Image Recovery}},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- month = jan,
- year = {2021},
- publisher = {CVF OpenAccess},
- url = {https://www.merl.com/publications/TR2021-003}
- }
Nowara, E., Marks, T.K., Mansour, H., Veeraraghavan, A., "Near-Infrared Imaging Photoplethysmography During Driving", IEEE Transactions on Intelligent Transportation Systems, DOI: 10.1109/TITS.2020.3038317, pp. 1-12, December 2020.
BibTeX TR2020-161 PDF
- @article{Nowara2020dec,
- author = {Nowara, Ewa and Marks, Tim K. and Mansour, Hassan and Veeraraghavan, Ashok},
- title = {{Near-Infrared Imaging Photoplethysmography During Driving}},
- journal = {IEEE Transactions on Intelligent Transportation Systems},
- pages = {1--12},
- month = dec,
- year = {2020},
- doi = {10.1109/TITS.2020.3038317},
- url = {https://www.merl.com/publications/TR2020-161}
- }
Li, M., Chen, S., Zhang, Y., "Graph Cross Networks with Vertex Infomax Pooling", Advances in Neural Information Processing Systems (NeurIPS), December 2020.
BibTeX TR2020-167 PDF
- @inproceedings{Li2020dec,
- author = {Li, Maosen and Chen, Siheng and Zhang, Ya},
- title = {{Graph Cross Networks with Vertex Infomax Pooling}},
- booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
- month = dec,
- year = {2020},
- url = {https://www.merl.com/publications/TR2020-167}
- }
Talreja, V., Koike-Akino, T., Wang, Y., Millar, D.S., Kojima, K., Parsons, K., "End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping", European Conference on Optical Communication (ECOC), DOI: 10.1109/ECOC48923.2020.9333382, November 2020.
BibTeX TR2020-155 PDF Video
- @inproceedings{Talreja2020nov,
- author = {Talreja, Veeru and Koike-Akino, Toshiaki and Wang, Ye and Millar, David S. and Kojima, Keisuke and Parsons, Kieran},
- title = {{End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping}},
- booktitle = {European Conference on Optical Communication (ECOC)},
- month = nov,
- year = {2020},
- publisher = {IEEE},
- doi = {10.1109/ECOC48923.2020.9333382},
- isbn = {978-1-7281-7361-0},
- url = {https://www.merl.com/publications/TR2020-155}
- }