Publications

Yen, H., Germain, F., Wichern, G., Le Roux, J., "Cold Diffusion for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10096064, May 2023, pp. 1-5.
BibTeX TR2023-020 PDF
- @inproceedings{Yen2023may,
-   author    = {Yen, Hao and Germain, Francois and Wichern, Gordon and {Le Roux}, Jonathan},
-   title     = {{Cold Diffusion for Speech Enhancement}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {1--5},
-   month     = may,
-   year      = {2023},
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP49357.2023.10096064},
-   url       = {https://www.merl.com/publications/TR2023-020}
- }
Zhao, Q., Ma, Y., Boufounos, P.T., Nabi, S., Mansour, H., "Deep Born Operator Learning for Reflection Tomographic Imaging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095494, May 2023, pp. 1-5.
BibTeX TR2023-029 PDF Video Data Software
- @inproceedings{Zhao2023may,
-   author    = {Zhao, Qingqing and Ma, Yanting and Boufounos, Petros T. and Nabi, Saleh and Mansour, Hassan},
-   title     = {{Deep Born Operator Learning for Reflection Tomographic Imaging}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {1--5},
-   month     = may,
-   year      = {2023},
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP49357.2023.10095494},
-   url       = {https://www.merl.com/publications/TR2023-029}
- }
Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
BibTeX TR2023-014 PDF Video Data Software Presentation
- @inproceedings{Cherian2023mar,
-   author    = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
-   title     = {{Are Deep Neural Networks SMARTer than Second Graders?}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   pages     = {10834--10844},
-   month     = mar,
-   year      = {2023},
-   publisher = {CVF},
-   url       = {https://www.merl.com/publications/TR2023-014}
- }
Yoshino, K., Chen, Y.-N., Crook, P., Kottur, S., Li, J., Hedayatnia, B., Moon, S., Fei, Z., Li, Z., Zhang, J., Feng, Y., Zhou, J., Kim, S., Liu, Y., Jin, D., Papangelis, A., Gopalakrishnan, K., Hakkani-Tur, D., Damavandi, B., Geramifard, A., Hori, C., Shah, A., Zhang, C., Li, H., Sedoc, J., D'Haro, L.F., Banchs, R., Rudnicky, A., "Overview of the Tenth Dialog System Technology Challenge: DSTC10", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TCSVT.2002.808437, Vol. 13, No. 2, pp. 121-130, February 2023.
BibTeX TR2023-109 PDF
- @article{Yoshino2023feb,
-   author        = {Yoshino, Koichiro and Chen, Yun-Nung and Crook, Paul and Kottur, Satwik and Li, Jinchao and Hedayatnia, Behnam and Moon, Seungwhan and Fei, Zhengcong and Li, Zekang and Zhang, Jinchao and Feng, Yang and Zhou, Jie and Kim, Seokhwan and Liu, Yang and Jin, Di and Papangelis, Alexandros and Gopalakrishnan, Karthik and Hakkani-Tur, Dilek and Damavandi, Babak and Geramifard, Alborz and Hori, Chiori and Shah, Ankit and Zhang, Chen and Li, Haizhou and Sedoc, Jo{\~a}o and D'Haro, Luis F. and Banchs, Rafael and Rudnicky, Alexander},
-   title         = {{Overview of the Tenth Dialog System Technology Challenge: DSTC10}},
-   journal       = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
-   volume        = {13},
-   number        = {2},
-   pages         = {121--130},
-   month         = feb,
-   year          = {2023},
-   doi           = {10.1109/TCSVT.2002.808437},
-   internal-note = {NOTE(review): the DOI string names TCSVT 2002 while the journal is TASLP 2023, and volume 13 disagrees with volume 31 given for this journal in entry Wang2022dec2; doi, volume, number and pages look like placeholders -- confirm against the publisher record before citing},
-   url           = {https://www.merl.com/publications/TR2023-109}
- }
Kojima, K., Koike-Akino, T., Wang, Y., Jung, M., Brand, M., "Inverse design of two-dimensional freeform metagrating using an adversarial conditional variational autoencoder", SPIE Photonics West, DOI: 10.1117/12.2650299, January 2023.
BibTeX TR2023-004 PDF
- @inproceedings{Kojima2023jan,
-   author    = {Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Jung, Minwoo and Brand, Matthew},
-   title     = {{Inverse design of two-dimensional freeform metagrating using an adversarial conditional variational autoencoder}},
-   booktitle = {Proc. SPIE 12431, Photonic and Phononic Properties of Engineered Nanostructures XIII},
-   month     = jan,
-   year      = {2023},
-   publisher = {SPIE},
-   doi       = {10.1117/12.2650299},
-   url       = {https://www.merl.com/publications/TR2023-004}
- }
Liu, T., Cherian, A., "Learning a Constrained Optimizer: A Primal Method", AAAI Bridge on Constraint Programming and Machine Learning, January 2023.
BibTeX TR2023-003 PDF
- @inproceedings{Liu2023jan,
-   author    = {Liu, Tao and Cherian, Anoop},
-   title     = {{Learning a Constrained Optimizer: A Primal Method}},
-   booktitle = {AAAI Bridge on Constraint Programming and Machine Learning},
-   month     = jan,
-   year      = {2023},
-   url       = {https://www.merl.com/publications/TR2023-003}
- }
Tohme, T., Liu, D., Youcef-Toumi, K., "GSR: A Generalized Symbolic Regression Approach", Transactions on Machine Learning Research, January 2023.
BibTeX TR2023-002 PDF
- @article{Tohme2023jan,
-   author  = {Tohme, Tony and Liu, Dehong and Youcef-Toumi, Kamal},
-   title   = {{GSR: A Generalized Symbolic Regression Approach}},
-   journal = {Transactions on Machine Learning Research},
-   month   = jan,
-   year    = {2023},
-   issn    = {2835-8856},
-   url     = {https://www.merl.com/publications/TR2023-002}
- }
Wang, Z.-Q., Wichern, G., Watanabe, S., Le Roux, J., "STFT-Domain Neural Speech Enhancement with Very Low Algorithmic Latency", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2022.3224285, Vol. 31, pp. 397-410, December 2022.
BibTeX TR2022-166 PDF
- @article{Wang2022dec2,
-   author  = {Wang, Zhong-Qiu and Wichern, Gordon and Watanabe, Shinji and {Le Roux}, Jonathan},
-   title   = {{STFT-Domain Neural Speech Enhancement with Very Low Algorithmic Latency}},
-   journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
-   volume  = {31},
-   pages   = {397--410},
-   month   = dec,
-   year    = {2022},
-   doi     = {10.1109/TASLP.2022.3224285},
-   issn    = {2329-9304},
-   url     = {https://www.merl.com/publications/TR2022-166}
- }
Singla, V., Aeron, S., Koike-Akino, T., Parsons, K., Brand, M., Wang, Y., "Learning with noisy labels using low-dimensional model trajectory", NeurIPS 2022 Workshop on Distribution Shifts (DistShift), December 2022.
BibTeX TR2022-156 PDF
- @inproceedings{Singla2022dec,
-   author    = {Singla, Vasu and Aeron, Shuchin and Koike-Akino, Toshiaki and Parsons, Kieran and Brand, Matthew and Wang, Ye},
-   title     = {{Learning with noisy labels using low-dimensional model trajectory}},
-   booktitle = {NeurIPS 2022 Workshop on Distribution Shifts: Connecting Methods and Applications},
-   month     = dec,
-   year      = {2022},
-   publisher = {OpenReview},
-   url       = {https://www.merl.com/publications/TR2022-156}
- }
Shimoya, R., Morimoto, T., van Baar, J., Boufounos, P.T., Ma, Y., Mansour, H., "Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images", IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), DOI: 10.1109/AVSS56176.2022.9959354, November 2022, pp. 1-8.
BibTeX TR2022-149 PDF
- @inproceedings{Shimoya2022nov,
-   author    = {Shimoya, Ryosuke and Morimoto, Takashi and {van Baar}, Jeroen and Boufounos, Petros T. and Ma, Yanting and Mansour, Hassan},
-   title     = {{Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images}},
-   booktitle = {IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS)},
-   pages     = {1--8},
-   month     = nov,
-   year      = {2022},
-   doi       = {10.1109/AVSS56176.2022.9959354},
-   isbn      = {978-1-6654-6382-9},
-   url       = {https://www.merl.com/publications/TR2022-149}
- }
Romero, D., Lohit, S., "Learning Partial Equivariances from Data", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 36466-36478.
BibTeX TR2022-148 PDF Software Presentation
- @inproceedings{Romero2022nov,
-   author    = {Romero, David and Lohit, Suhas},
-   title     = {{Learning Partial Equivariances from Data}},
-   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
-   editor    = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
-   pages     = {36466--36478},
-   month     = nov,
-   year      = {2022},
-   url       = {https://www.merl.com/publications/TR2022-148}
- }
Wang, H., Lohit, S., Jones, M.J., Fu, R., "What Makes a “Good” Data Augmentation in Knowledge Distillation – A Statistical Perspective", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 13456-13469.
BibTeX TR2022-147 PDF
- @inproceedings{Wang2022nov,
-   author    = {Wang, Huan and Lohit, Suhas and Jones, Michael J. and Fu, Raymond},
-   title     = {{What Makes a ``Good'' Data Augmentation in Knowledge Distillation -- A Statistical Perspective}},
-   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
-   editor    = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
-   pages     = {13456--13469},
-   month     = nov,
-   year      = {2022},
-   url       = {https://www.merl.com/publications/TR2022-147}
- }
Venkatesh, S., Wichern, G., Subramanian, A.S., Le Roux, J., "Improved Domain Generalization via Disentangled Multi-Task Learning in Unsupervised Anomalous Sound Detection", DCASE Workshop, Lagrange, M. and Mesaros, A. and Pellegrini, T. and Richard, G. and Serizel, R. and Stowell, D., Eds., November 2022.
BibTeX TR2022-146 PDF Presentation
- @inproceedings{Venkatesh2022nov,
-   author    = {Venkatesh, Satvik and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
-   title     = {{Improved Domain Generalization via Disentangled Multi-Task Learning in Unsupervised Anomalous Sound Detection}},
-   booktitle = {DCASE Workshop},
-   editor    = {Lagrange, M. and Mesaros, A. and Pellegrini, T. and Richard, G. and Serizel, R. and Stowell, D.},
-   month     = nov,
-   year      = {2022},
-   isbn      = {978-952-03-2677-7},
-   url       = {https://www.merl.com/publications/TR2022-146}
- }
Yu, X., Smedemark-Margulies, N., Aeron, S., Koike-Akino, T., Moulin, P., Brand, M., Parsons, K., Wang, Y., "Improving Adversarial Robustness by Learning Shared Information", Pattern Recognition, DOI: 10.1016/j.patcog.2022.109054, Vol. 134, pp. 109054, November 2022.
BibTeX TR2022-141 PDF
- @article{Yu2022nov,
-   author  = {Yu, Xi and Smedemark-Margulies, Niklas and Aeron, Shuchin and Koike-Akino, Toshiaki and Moulin, Pierre and Brand, Matthew and Parsons, Kieran and Wang, Ye},
-   title   = {{Improving Adversarial Robustness by Learning Shared Information}},
-   journal = {Pattern Recognition},
-   volume  = {134},
-   pages   = {109054},
-   month   = nov,
-   year    = {2022},
-   doi     = {10.1016/j.patcog.2022.109054},
-   issn    = {0031-3203},
-   url     = {https://www.merl.com/publications/TR2022-141}
- }
Ahmed, S.M., Lohit, S., Peng, K.-C., Jones, M.J., Roy Chowdhury, A.K., "Cross-Modal Knowledge Transfer Without Task-Relevant Source Data", European Conference on Computer Vision (ECCV), Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G.M. and Hassner, T., Eds., DOI: 10.1007/978-3-031-19830-4_7, October 2022, pp. 111-127.
BibTeX TR2022-135 PDF Video Software Presentation
- @inproceedings{Ahmed2022oct,
-   author    = {Ahmed, Sk Miraj and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Roy Chowdhury, Amit K.},
-   title     = {{Cross-Modal Knowledge Transfer Without Task-Relevant Source Data}},
-   booktitle = {European Conference on Computer Vision (ECCV)},
-   editor    = {Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G. M. and Hassner, T.},
-   pages     = {111--127},
-   month     = oct,
-   year      = {2022},
-   publisher = {Springer},
-   doi       = {10.1007/978-3-031-19830-4_7},
-   isbn      = {978-3-031-19830-4},
-   url       = {https://www.merl.com/publications/TR2022-135}
- }
Xia, H., Wang, P., Ding, Z., "Incomplete Multi-view Domain Adaptation via Channel Enhancement and Knowledge Transfer", European Conference on Computer Vision (ECCV), DOI: 10.1007/978-3-031-19830-4_12, October 2022.
BibTeX TR2022-134 PDF
- @inproceedings{Xia2022oct,
-   author    = {Xia, Haifeng and Wang, Pu and Ding, Zhengming},
-   title     = {{Incomplete Multi-view Domain Adaptation via Channel Enhancement and Knowledge Transfer}},
-   booktitle = {European Conference on Computer Vision (ECCV)},
-   month     = oct,
-   year      = {2022},
-   doi       = {10.1007/978-3-031-19830-4_12},
-   isbn      = {978-3-031-19830-4},
-   url       = {https://www.merl.com/publications/TR2022-134}
- }
Leu, J., Wang, Y., Tomizuka, M., Di Cairano, S., "Improved A-Search Guided Tree for Autonomous Trailer Planning", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS47612.2022.9982121, October 2022.
BibTeX TR2022-133 PDF
- @inproceedings{Leu2022oct,
-   author    = {Leu, Jessica and Wang, Yebin and Tomizuka, Masayoshi and {Di Cairano}, Stefano},
-   title     = {{Improved A-Search Guided Tree for Autonomous Trailer Planning}},
-   booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
-   month     = oct,
-   year      = {2022},
-   doi       = {10.1109/IROS47612.2022.9982121},
-   url       = {https://www.merl.com/publications/TR2022-133}
- }
Paul, S., Roy Chowdhury, A.K., Cherian, A., "AVLEN: Audio-Visual-Language Embodied Navigation in 3D Environments", Advances in Neural Information Processing Systems (NeurIPS), October 2022, pp. 6236-6249.
BibTeX TR2022-131 PDF Video Data Software
- @inproceedings{Paul2022oct2,
-   author    = {Paul, Sudipta and Roy Chowdhury, Amit K. and Cherian, Anoop},
-   title     = {{AVLEN: Audio-Visual-Language Embodied Navigation in 3D Environments}},
-   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
-   pages     = {6236--6249},
-   month     = oct,
-   year      = {2022},
-   url       = {https://www.merl.com/publications/TR2022-131}
- }
Mansour, H., Lohit, S., Boufounos, P.T., "Distributed Radar Autofocus Imaging Using Deep Priors", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/ICIP46576.2022.9897332, October 2022, pp. 2511-2515.
BibTeX TR2022-129 PDF Video
- @inproceedings{Mansour2022oct,
-   author    = {Mansour, Hassan and Lohit, Suhas and Boufounos, Petros T.},
-   title     = {{Distributed Radar Autofocus Imaging Using Deep Priors}},
-   booktitle = {IEEE International Conference on Image Processing (ICIP)},
-   pages     = {2511--2515},
-   month     = oct,
-   year      = {2022},
-   doi       = {10.1109/ICIP46576.2022.9897332},
-   url       = {https://www.merl.com/publications/TR2022-129}
- }
Koike-Akino, T., Wang, Y., "quEEGNet: Quantum AI for Biosignal Processing", IEEE Conference on Biomedical and Health Informatics (BHI), DOI: 10.1109/BHI56158.2022.9926814, September 2022.
BibTeX TR2022-121 PDF Video Presentation
- @inproceedings{Koike-Akino2022sep,
-   author    = {Koike-Akino, Toshiaki and Wang, Ye},
-   title     = {{quEEGNet: Quantum AI for Biosignal Processing}},
-   booktitle = {IEEE Conference on Biomedical and Health Informatics (BHI)},
-   month     = sep,
-   year      = {2022},
-   publisher = {IEEE},
-   doi       = {10.1109/BHI56158.2022.9926814},
-   issn      = {2641-3604},
-   isbn      = {978-1-6654-8791-7},
-   url       = {https://www.merl.com/publications/TR2022-121}
- }
Zawislak, R., Greiff, M., Kim, K.J., Berntorp, K., Di Cairano, S., Mao, K., Parsons, K., Orlik, P.V., Sato, Y., "GNSS Multipath Detection Aided by Unsupervised Domain Adaptation", ION-GNSS+ Conference, DOI: 10.33012/2022.18333, September 2022, pp. 2127-2137.
BibTeX TR2022-118 PDF
- @inproceedings{Zawislak2022sep,
-   author    = {Zawislak, Remy and Greiff, Marcus and Kim, Kyeong Jin and Berntorp, Karl and {Di Cairano}, Stefano and Mao, Konishi and Parsons, Kieran and Orlik, Philip V. and Sato, Yuki},
-   title     = {{GNSS Multipath Detection Aided by Unsupervised Domain Adaptation}},
-   booktitle = {ION-GNSS+ Conference},
-   pages     = {2127--2137},
-   month     = sep,
-   year      = {2022},
-   publisher = {Institute of Navigation},
-   doi       = {10.33012/2022.18333},
-   url       = {https://www.merl.com/publications/TR2022-118}
- }
Suda, T., Nikovski, D., "Deep Reinforcement Learning for Optimal Sailing Upwind", IEEE International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/IJCNN55064.2022.9892369, September 2022, pp. 1-8.
BibTeX TR2022-102 PDF
- @inproceedings{Suda2022sep,
-   author    = {Suda, Takumi and Nikovski, Daniel},
-   title     = {{Deep Reinforcement Learning for Optimal Sailing Upwind}},
-   booktitle = {IEEE International Joint Conference on Neural Networks (IJCNN)},
-   pages     = {1--8},
-   month     = sep,
-   year      = {2022},
-   publisher = {IEEE},
-   doi       = {10.1109/IJCNN55064.2022.9892369},
-   issn      = {2161-4393},
-   isbn      = {978-1-7281-8671-9},
-   url       = {https://www.merl.com/publications/TR2022-102}
- }
Hori, C., Hori, T., Le Roux, J., "Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers", Interspeech, DOI: 10.21437/Interspeech.2022-10891, September 2022, pp. 4511-4515.
BibTeX TR2022-116 PDF
- @inproceedings{Hori2022sep,
-   author    = {Hori, Chiori and Hori, Takaaki and {Le Roux}, Jonathan},
-   title     = {{Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers}},
-   booktitle = {Interspeech},
-   pages     = {4511--4515},
-   month     = sep,
-   year      = {2022},
-   doi       = {10.21437/Interspeech.2022-10891},
-   url       = {https://www.merl.com/publications/TR2022-116}
- }
Tzinis, E., Wichern, G., Subramanian, A.S., Smaragdis, P., Le Roux, J., "Heterogeneous Target Speech Separation", Interspeech, DOI: 10.21437/Interspeech.2022-10717, September 2022, pp. 1796-1800.
BibTeX TR2022-115 PDF Video Presentation
- @inproceedings{Tzinis2022sep,
-   author    = {Tzinis, Efthymios and Wichern, Gordon and Subramanian, Aswin Shanmugam and Smaragdis, Paris and {Le Roux}, Jonathan},
-   title     = {{Heterogeneous Target Speech Separation}},
-   booktitle = {Interspeech},
-   pages     = {1796--1800},
-   month     = sep,
-   year      = {2022},
-   doi       = {10.21437/Interspeech.2022-10717},
-   url       = {https://www.merl.com/publications/TR2022-115}
- }
Higuchi, Y., Moritz, N., Le Roux, J., Hori, T., "Momentum Pseudo-Labeling: Semi-Supervised ASR with Continuously Improving Pseudo-Labels", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2022.3195367, Vol. 16, No. 6, pp. 1424-1438, September 2022.
BibTeX TR2022-112 PDF
- @article{Higuchi2022sep,
-   author  = {Higuchi, Yosuke and Moritz, Niko and {Le Roux}, Jonathan and Hori, Takaaki},
-   title   = {{Momentum Pseudo-Labeling: Semi-Supervised ASR with Continuously Improving Pseudo-Labels}},
-   journal = {IEEE Journal of Selected Topics in Signal Processing},
-   volume  = {16},
-   number  = {6},
-   pages   = {1424--1438},
-   month   = sep,
-   year    = {2022},
-   doi     = {10.1109/JSTSP.2022.3195367},
-   issn    = {1941-0484},
-   url     = {https://www.merl.com/publications/TR2022-112}
- }