Publications

627 / 3,733 publications found.


  •  Hori, C., Hori, T., Le Roux, J., "Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers", Interspeech, DOI: 10.21437/Interspeech.2022-10891, September 2022, pp. 4511-4515.
    BibTeX TR2022-116 PDF
    • @inproceedings{Hori2022sep,
    •   author    = {Hori, Chiori and Hori, Takaaki and Le Roux, Jonathan},
    •   title     = {Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers},
    •   booktitle = {Interspeech},
    •   pages     = {4511--4515},
    •   month     = sep,
    •   year      = {2022},
    •   doi       = {10.21437/Interspeech.2022-10891},
    •   url       = {https://www.merl.com/publications/TR2022-116}
    • }
  •  Tzinis, E., Wichern, G., Subramanian, A.S., Smaragdis, P., Le Roux, J., "Heterogeneous Target Speech Separation", Interspeech, DOI: 10.21437/Interspeech.2022-10717, September 2022, pp. 1796-1800.
    BibTeX TR2022-115 PDF Video Presentation
    • @inproceedings{Tzinis2022sep,
    •   author    = {Tzinis, Efthymios and Wichern, Gordon and Subramanian, Aswin Shanmugam and Smaragdis, Paris and Le Roux, Jonathan},
    •   title     = {Heterogeneous Target Speech Separation},
    •   booktitle = {Interspeech},
    •   pages     = {1796--1800},
    •   month     = sep,
    •   year      = {2022},
    •   doi       = {10.21437/Interspeech.2022-10717},
    •   url       = {https://www.merl.com/publications/TR2022-115}
    • }
  •  Higuchi, Y., Moritz, N., Le Roux, J., Hori, T., "Momentum Pseudo-Labeling: Semi-Supervised ASR with Continuously Improving Pseudo-Labels", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2022.3195367, Vol. 16, No. 6, pp. 1424-1438, September 2022.
    BibTeX TR2022-112 PDF
    • @article{Higuchi2022sep,
    • author = {Higuchi, Yosuke and Moritz, Niko and Le Roux, Jonathan and Hori, Takaaki},
    • title = {Momentum Pseudo-Labeling: Semi-Supervised {ASR} with Continuously Improving Pseudo-Labels},
    • journal = {IEEE Journal of Selected Topics in Signal Processing},
    • year = 2022,
    • volume = 16,
    • number = 6,
    • pages = {1424--1438},
    • month = sep,
    • doi = {10.1109/JSTSP.2022.3195367},
    • issn = {1941-0484},
    • url = {https://www.merl.com/publications/TR2022-112}
    • }
  •  Koike-Akino, T., Wang, P., Yamashita, G., Tsujita, W., Nakajima, M., "Quantum Feature Extraction for THz Multi-Layer Imaging", International Conference on Infrared, Millimeter, and Terahertz Waves (IRMMW-THz), DOI: 10.1109/IRMMW-THz50927.2022.9896037, August 2022.
    BibTeX TR2022-110 PDF Video Presentation
    • @inproceedings{Koike-Akino2022aug,
    • author = {Koike-Akino, Toshiaki and Wang, Pu and Yamashita, Genki and Tsujita, Wataru and Nakajima, M.},
    • title = {Quantum Feature Extraction for {THz} Multi-Layer Imaging},
    • booktitle = {International Conference on Infrared, Millimeter, and Terahertz Waves (IRMMW-THz)},
    • year = 2022,
    • month = aug,
    • publisher = {IEEE},
    • doi = {10.1109/IRMMW-THz50927.2022.9896037},
    • issn = {2162-2035},
    • isbn = {978-1-7281-9427-1},
    • url = {https://www.merl.com/publications/TR2022-110}
    • }
  •  Liu, Bryan, Koike-Akino, Toshiaki, Wang, Ye, Kim, Kyeong Jin, Brand, Matthew, Aeron, Shuchin, Parsons, Kieran, "Data Privacy and Protection on Deep Leakage from Gradients by Layer-Wise Pruning", Tech. Rep. TR2022-081, Mitsubishi Electric Research Laboratories, Cambridge, MA, August 2022.
    BibTeX TR2022-081 PDF
    • @techreport{MERL_TR2022-081,
    • author = {Liu, Bryan and Koike-Akino, Toshiaki and Wang, Ye and Kim, Kyeong Jin and Brand, Matthew and Aeron, Shuchin and Parsons, Kieran},
    • title = {Data Privacy and Protection on Deep Leakage from Gradients by Layer-Wise Pruning},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2022-081},
    • month = aug,
    • year = 2022,
    • url = {https://www.merl.com/publications/TR2022-081/}
    • }
  •  Kojima, K., Jung, M., Koike-Akino, T., Wang, Y., Brand, M., Parsons, K., "Deep Transfer Learning for Nanophotonic Device Design", Conference on Lasers and Electro-Optics (CLEO) Pacific Rim, July 2022.
    BibTeX TR2022-107 PDF
    • @inproceedings{Kojima2022jul,
    •   author    = {Kojima, Keisuke and Jung, Minwoo and Koike-Akino, Toshiaki and Wang, Ye and Brand, Matthew and Parsons, Kieran},
    •   title     = {Deep Transfer Learning for Nanophotonic Device Design},
    •   booktitle = {Proceedings of the 2022 Conference on Lasers and Electro-Optics Pacific Rim},
    •   publisher = {Optica Publishing Group},
    •   month     = jul,
    •   year      = {2022},
    •   url       = {https://www.merl.com/publications/TR2022-107}
    • }
  •  Koike-Akino, T., Wang, Y., "AutoVAE: Mismatched Variational Autoencoder with Irregular Posterior Prior Pairing", IEEE International Symposium on Information Theory (ISIT), DOI: 10.1109/ISIT50566.2022.9834769, July 2022.
    BibTeX TR2022-071 PDF Video Presentation
    • @inproceedings{Koike-Akino2022jul,
    • author = {Koike-Akino, Toshiaki and Wang, Ye},
    • title = {{AutoVAE}: Mismatched Variational Autoencoder with Irregular Posterior Prior Pairing},
    • booktitle = {IEEE International Symposium on Information Theory (ISIT)},
    • year = 2022,
    • month = jul,
    • publisher = {IEEE},
    • doi = {10.1109/ISIT50566.2022.9834769},
    • issn = {2157-8117},
    • isbn = {978-1-6654-2159-1},
    • url = {https://www.merl.com/publications/TR2022-071}
    • }
  •  Rambhatla, S., Jones, M.J., Chellappa, R., "An Empirical Analysis of Boosting Deep Networks", International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/IJCNN55064.2022.9892204, July 2022.
    BibTeX TR2022-075 PDF Presentation
    • @inproceedings{Rambhatla2022jul,
    •   author    = {Rambhatla, Sai and Jones, Michael J. and Chellappa, Rama},
    •   title     = {An Empirical Analysis of Boosting Deep Networks},
    •   booktitle = {International Joint Conference on Neural Networks (IJCNN)},
    •   month     = jul,
    •   year      = {2022},
    •   doi       = {10.1109/IJCNN55064.2022.9892204},
    •   url       = {https://www.merl.com/publications/TR2022-075}
    • }
  •  Demir, A., Koike-Akino, T., Wang, Y., Erdogmus, D., "EEG-GAT: Graph Attention Networks for Classification of Electroencephalogram (EEG) Signals", International Conference of the IEEE Engineering in Medicine & Biology Society (EMBS), DOI: 10.1109/EMBC48229.2022.9871984, July 2022.
    BibTeX TR2022-097 PDF
    • @inproceedings{Demir2022jul,
    • author = {Demir, Andac and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
    • title = {{EEG-GAT}: Graph Attention Networks for Classification of Electroencephalogram ({EEG}) Signals},
    • booktitle = {International Conference of the IEEE Engineering in Medicine \& Biology Society (EMBS)},
    • year = 2022,
    • month = jul,
    • publisher = {IEEE},
    • doi = {10.1109/EMBC48229.2022.9871984},
    • issn = {2694-0604},
    • isbn = {978-1-7281-2782-8},
    • url = {https://www.merl.com/publications/TR2022-097}
    • }
  •  Smedemark-Margulies, N., Wang, Y., Koike-Akino, T., Erdogmus, D., "AutoTransfer: Subject Transfer Learning with Censored Representations on Biosignals Data", International Conference of the IEEE Engineering in Medicine & Biology Society (EMBS), DOI: 10.1109/EMBC48229.2022.9871649, July 2022.
    BibTeX TR2022-098 PDF Software
    • @inproceedings{Smedemark-Margulies2022jul,
    • author = {Smedemark-Margulies, Niklas and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    • title = {{AutoTransfer}: Subject Transfer Learning with Censored Representations on Biosignals Data},
    • booktitle = {International Conference of the IEEE Engineering in Medicine \& Biology Society (EMBS)},
    • year = 2022,
    • month = jul,
    • publisher = {IEEE},
    • doi = {10.1109/EMBC48229.2022.9871649},
    • issn = {2694-0604},
    • isbn = {978-1-7281-2782-8},
    • url = {https://www.merl.com/publications/TR2022-098}
    • }
  •  Cao, W., Benosman, M., Zhang, X., Ma, R., "Domain Knowledge-Infused Deep Learning for Automated Analog/Radio-Frequency Circuit Parameter Optimization", ACM/IEEE Design Automation Conference, July 2022.
    BibTeX TR2022-096 PDF
    • @inproceedings{Cao2022jul,
    •   author    = {Cao, Weidong and Benosman, Mouhacine and Zhang, Xuan and Ma, Rui},
    •   title     = {Domain Knowledge-Infused Deep Learning for Automated Analog/Radio-Frequency Circuit Parameter Optimization},
    •   booktitle = {ACM/IEEE Design Automation Conference},
    •   month     = jul,
    •   year      = {2022},
    •   url       = {https://www.merl.com/publications/TR2022-096}
    • }
  •  Venkatesh, S., Wichern, G., Subramanian, A.S., Le Roux, J., "Disentangled Surrogate Task Learning for Improved Domain Generalization in Unsupervised Anomalous Sound Detection", Tech. Rep. TR2022-092, Detection and Classification of Acoustic Scenes and Events (DCASE) Challenge 2022, July 2022.
    BibTeX TR2022-092 PDF Presentation
    • @techreport{Venkatesh2022jul,
    • author = {Venkatesh, Satvik and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
    • title = {Disentangled Surrogate Task Learning for Improved Domain Generalization in Unsupervised Anomalous Sound Detection},
    • institution = {DCASE2022 Challenge},
    • year = 2022,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2022-092}
    • }
  •  Sullivan, A., Wang, J., Li, X., Chen, S., Abbot, L., "PointMotionNet: Point-Wise Motion Learning for Large-Scale LiDAR Point Clouds Sequences", CVPR Workshop on Autonomous Driving, June 2022.
    BibTeX TR2022-083 PDF
    • @inproceedings{Sullivan2022jun,
    • author = {Sullivan, Alan and Wang, Jun and Li, Xiaolong and Chen, Siheng and Abbot, Lynn},
    • title = {{PointMotionNet}: Point-Wise Motion Learning for Large-Scale {LiDAR} Point Clouds Sequences},
    • booktitle = {CVPR Workshop on Autonomous Driving},
    • year = 2022,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2022-083}
    • }
  •  Koike-Akino, T., Wang, P., Wang, Y., "AutoQML: Automated Quantum Machine Learning for Wi-Fi Integrated Sensing and Communications", IEEE Sensor Array and Multichannel Signal Processing Workshop (SAM), DOI: 10.1109/SAM53842.2022.9827846, June 2022.
    BibTeX TR2022-068 PDF Video Presentation
    • @inproceedings{Koike-Akino2022jun,
    • author = {Koike-Akino, Toshiaki and Wang, Pu and Wang, Ye},
    • title = {{AutoQML}: Automated Quantum Machine Learning for {Wi-Fi} Integrated Sensing and Communications},
    • booktitle = {IEEE Sensor Array and Multichannel Signal Processing Workshop (SAM)},
    • year = 2022,
    • month = jun,
    • doi = {10.1109/SAM53842.2022.9827846},
    • url = {https://www.merl.com/publications/TR2022-068}
    • }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Quantifying Predictive Uncertainty for Stochastic Video Synthesis from Audio", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), June 2022.
    BibTeX TR2022-082 PDF
    • @inproceedings{Chatterjee2022jun,
    •   author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
    •   title     = {Quantifying Predictive Uncertainty for Stochastic Video Synthesis from Audio},
    •   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
    •   month     = jun,
    •   year      = {2022},
    •   url       = {https://www.merl.com/publications/TR2022-082}
    • }
  •  Liu, B., Koike-Akino, T., Wang, Y., Kim, K.J., Brand, M., Aeron, S., Parsons, K., "Data Privacy and Protection on Deep Leakage from Gradients by Layer-Wise Pruning", IEEE Information Theory and Applications Workshop (ITA), June 2022.
    BibTeX TR2022-080 PDF Presentation
    • @inproceedings{Liu2022jun,
    •   author    = {Liu, Bryan and Koike-Akino, Toshiaki and Wang, Ye and Kim, Kyeong Jin and Brand, Matthew and Aeron, Shuchin and Parsons, Kieran},
    •   title     = {Data Privacy and Protection on Deep Leakage from Gradients by Layer-Wise Pruning},
    •   booktitle = {IEEE Information Theory and Applications Workshop (ITA)},
    •   month     = jun,
    •   year      = {2022},
    •   url       = {https://www.merl.com/publications/TR2022-080}
    • }
  •  Sun, Y., Benosman, M., Ma, R., "GaN Distributed RF Power Amplifier Automation Design with Deep Reinforcement Learning", International Conference on Artificial Intelligence Circuits and Systems (AICAS), June 2022.
    BibTeX TR2022-074 PDF
    • @inproceedings{Sun2022jun,
    • author = {Sun, Yuxiang and Benosman, Mouhacine and Ma, Rui},
    • title = {{GaN} Distributed {RF} Power Amplifier Automation Design with Deep Reinforcement Learning},
    • booktitle = {International Conference on Artificial Intelligence Circuits and Systems (AICAS)},
    • year = 2022,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2022-074}
    • }
  •  Zhu, X., Jain, S., Tomizuka, M., van Baar, J., "Learning to Synthesize Volumetric Meshes from Vision-based Tactile Imprints", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA46639.2022.9812092, May 2022, pp. 4833-4839.
    BibTeX TR2022-055 PDF
    • @inproceedings{Zhu2022may2,
    •   author    = {Zhu, Xinghao and Jain, Siddarth and Tomizuka, Masayoshi and van Baar, Jeroen},
    •   title     = {Learning to Synthesize Volumetric Meshes from Vision-based Tactile Imprints},
    •   booktitle = {2022 IEEE International Conference on Robotics and Automation (ICRA)},
    •   pages     = {4833--4839},
    •   publisher = {IEEE},
    •   month     = may,
    •   year      = {2022},
    •   doi       = {10.1109/ICRA46639.2022.9812092},
    •   isbn      = {978-1-7281-9681-7},
    •   url       = {https://www.merl.com/publications/TR2022-055}
    • }
  •  Liu, B., Koike-Akino, T., Wang, Y., Parsons, K., "Variational Quantum Compressed Sensing for Joint User and Channel State Acquisition in Grant-Free Device Access Systems", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC45855.2022.9838445, May 2022.
    BibTeX TR2022-052 PDF Video Presentation
    • @inproceedings{Liu2022may3,
    •   author    = {Liu, Bryan and Koike-Akino, Toshiaki and Wang, Ye and Parsons, Kieran},
    •   title     = {Variational Quantum Compressed Sensing for Joint User and Channel State Acquisition in Grant-Free Device Access Systems},
    •   booktitle = {IEEE International Conference on Communications (ICC)},
    •   publisher = {IEEE},
    •   month     = may,
    •   year      = {2022},
    •   doi       = {10.1109/ICC45855.2022.9838445},
    •   issn      = {1938-1883},
    •   isbn      = {978-1-5386-8347-7},
    •   url       = {https://www.merl.com/publications/TR2022-052}
    • }
  •  Jung, M., Kojima, K., Koike-Akino, T., Wang, Y., Zhu, D., Brand, M., "Finding the Right Deep Neural Network Model for Efficient Design of Tunable Nanophotonic Devices", Conference on Lasers and Electro-Optics (CLEO), DOI: 10.1364/CLEO_SI.2022.SW5E.6, May 2022.
    BibTeX TR2022-047 PDF Video Presentation
    • @inproceedings{Jung2022may,
    •   author    = {Jung, Minwoo and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Zhu, Dayu and Brand, Matthew},
    •   title     = {Finding the Right Deep Neural Network Model for Efficient Design of Tunable Nanophotonic Devices},
    •   booktitle = {Conference on Lasers and Electro-Optics (CLEO)},
    •   publisher = {Optica},
    •   month     = may,
    •   year      = {2022},
    •   doi       = {10.1364/CLEO_SI.2022.SW5E.6},
    •   isbn      = {978-1-957171-05-0},
    •   url       = {https://www.merl.com/publications/TR2022-047}
    • }
  •  Koike-Akino, T., Kojima, K., Wang, Y., "AutoML Hyperparameter Tuning of Generative DNN Architecture for Nanophotonic Device Design", Conference on Lasers and Electro-Optics (CLEO), DOI: 10.1364/CLEO_AT.2022.JW3A.44, May 2022.
    BibTeX TR2022-046 PDF Presentation
    • @inproceedings{Koike-Akino2022may3,
    • author = {Koike-Akino, Toshiaki and Kojima, Keisuke and Wang, Ye},
    • title = {{AutoML} Hyperparameter Tuning of Generative {DNN} Architecture for Nanophotonic Device Design},
    • booktitle = {Conference on Lasers and Electro-Optics (CLEO)},
    • year = 2022,
    • month = may,
    • publisher = {Optica},
    • doi = {10.1364/CLEO_AT.2022.JW3A.44},
    • isbn = {978-1-957171-05-0},
    • url = {https://www.merl.com/publications/TR2022-046}
    • }
  •  Chang, X., Moritz, N., Hori, T., Watanabe, S., Le Roux, J., "Extended Graph Temporal Classification for Multi-Speaker End-to-End ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP43922.2022.9747375, April 2022, pp. 7322-7326.
    BibTeX TR2022-021 PDF
    • @inproceedings{Chang2022apr,
    • author = {Chang, Xuankai and Moritz, Niko and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {Extended Graph Temporal Classification for Multi-Speaker End-to-End {ASR}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {7322--7326},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9747375},
    • url = {https://www.merl.com/publications/TR2022-021}
    • }
  •  Higuchi, Y., Moritz, N., Le Roux, J., Hori, T., "Advancing Momentum Pseudo-Labeling with Conformer and Initialization Strategy", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP43922.2022.9746275, April 2022, pp. 7672-7676.
    BibTeX TR2022-026 PDF
    • @inproceedings{Higuchi2022apr,
    •   author    = {Higuchi, Yosuke and Moritz, Niko and Le Roux, Jonathan and Hori, Takaaki},
    •   title     = {Advancing Momentum Pseudo-Labeling with Conformer and Initialization Strategy},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   pages     = {7672--7676},
    •   publisher = {IEEE},
    •   month     = apr,
    •   year      = {2022},
    •   doi       = {10.1109/ICASSP43922.2022.9746275},
    •   url       = {https://www.merl.com/publications/TR2022-026}
    • }
  •  Moritz, N., Hori, T., Watanabe, S., Le Roux, J., "Sequence Transduction with Graph-based Supervision", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP43922.2022.9747788, April 2022, pp. 7212-7216.
    BibTeX TR2022-024 PDF
    • @inproceedings{Moritz2022apr,
    •   author    = {Moritz, Niko and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan},
    •   title     = {Sequence Transduction with Graph-based Supervision},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   pages     = {7212--7216},
    •   publisher = {IEEE},
    •   month     = apr,
    •   year      = {2022},
    •   doi       = {10.1109/ICASSP43922.2022.9747788},
    •   url       = {https://www.merl.com/publications/TR2022-024}
    • }
  •  Peng, K.-C., "Iterative Self Knowledge Distillation -- From Pothole Classification To Fine-Grained And COVID Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), Gan, W.-S. and Ma, K. K., Eds., DOI: 10.1109/ICASSP43922.2022.9746470, April 2022, pp. 3139-3143.
    BibTeX TR2022-020 PDF Video Presentation
    • @inproceedings{Peng2022apr,
    • author = {Peng, Kuan-Chuan},
    • title = {Iterative Self Knowledge Distillation -- From Pothole Classification To Fine-Grained And {COVID} Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • editor = {Gan, W.-S. and Ma, K. K.},
    • pages = {3139--3143},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9746470},
    • issn = {1520-6149},
    • isbn = {978-1-6654-0541-6},
    • url = {https://www.merl.com/publications/TR2022-020}
    • }