Publications

235 / 3,892 publications found.


  •  Steinmetz, C., Uhle, C., Everardo, F., Mitcheltree, C., McElveen, J.K., Jot, J.-M., Wichern, G., "Audio Signal Processing in the Artificial Intelligence Era: Challenges and Directions", Journal of the Audio Engineering Society, August 2025.
    BibTeX TR2025-116 PDF
    • @article{Steinmetz2025aug,
    • author = {Steinmetz, Christian and Uhle, Christian and Everardo, Flavio and Mitcheltree, Christopher and McElveen, J. Keith and Jot, Jean-Marc and Wichern, Gordon},
    • title = {{Audio Signal Processing in the Artificial Intelligence Era: Challenges and Directions}},
    • journal = {Journal of the Audio Engineering Society},
    • year = 2025,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2025-116}
    • }
  •  Kato, S., Wang, P., Koike-Akino, T., Fujihashi, T., Mansour, H., Boufounos, P.T., "Multi-Band Wi-Fi Neural Dynamic Fusion", IEEE Transactions on Wireless Communications, July 2025.
    BibTeX TR2025-115 PDF
    • @article{Kato2025jul,
    • author = {Kato, Sorachi and Wang, Pu and Koike-Akino, Toshiaki and Fujihashi, Takuya and Mansour, Hassan and Boufounos, Petros T.},
    • title = {{Multi-Band Wi-Fi Neural Dynamic Fusion}},
    • journal = {IEEE Transactions on Wireless Communications},
    • year = 2025,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2025-115}
    • }
  •  Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", arXiv, July 2025.
    BibTeX arXiv
    • @article{Paissan2025jul,
    • author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, François G. and Saijo, Kohei and {Le Roux}, Jonathan},
    • title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
    • journal = {arXiv},
    • year = 2025,
    • month = jul,
    • url = {https://www.arxiv.org/abs/2507.11435}
    • }
  •  Pavlasek, N., Di Cairano, S., Weiss, A., "Geostationary Satellite Station Keeping and Collocation under High-Thrust Impulsive Control", American Control Conference (ACC), July 2025.
    BibTeX TR2025-101 PDF
    • @inproceedings{Pavlasek2025jul,
    • author = {Pavlasek, Natalia and {Di Cairano}, Stefano and Weiss, Avishai},
    • title = {{Geostationary Satellite Station Keeping and Collocation under High-Thrust Impulsive Control}},
    • booktitle = {American Control Conference (ACC)},
    • year = 2025,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2025-101}
    • }
  •  Dai, M., Lu, Z., Li, N., Wang, Y., "Enhanced Agility and Safety in Mobile Manipulators through Centroidal Momentum-Based Motion Planning", European Control Conference (ECC), June 2025.
    BibTeX TR2025-092 PDF
    • @inproceedings{Dai2025jun,
    • author = {Dai, Min and Lu, Zehui and Li, Na and Wang, Yebin},
    • title = {{Enhanced Agility and Safety in Mobile Manipulators through Centroidal Momentum-Based Motion Planning}},
    • booktitle = {European Control Conference (ECC)},
    • year = 2025,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2025-092}
    • }
  •  Masuyama, Y., "Single- and Multi-Channel Speech Enhancement and Separation for Far-Field Conversation Recognition," Tech. Rep. TR2025-097, Jelinek Summer Workshop on Speech and Language Technology (JSALT), June 2025.
    BibTeX TR2025-097 PDF
    • @techreport{Masuyama2025jun,
    • author = {Masuyama, Yoshiki},
    • title = {{Single- and Multi-Channel Speech Enhancement and Separation for Far-Field Conversation Recognition}},
    • institution = {Jelinek Summer Workshop on Speech and Language Technology (JSALT)},
    • year = 2025,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2025-097}
    • }
  •  Vats, S., Jha, D.K., Likhachev, M., Kroemer, O., Romeres, D., "RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation", R3: Reasoning for Robust Robot Manipulation in the Open World Workshop at R:SS 2025, June 2025.
    BibTeX TR2025-091 PDF
    • @inproceedings{Vats2025jun,
    • author = {Vats, Shivam and Jha, Devesh K. and Likhachev, Maxim and Kroemer, Oliver and Romeres, Diego},
    • title = {{RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation}},
    • booktitle = {R3: Reasoning for Robust Robot Manipulation in the Open World Workshop at R:SS 2025},
    • year = 2025,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2025-091}
    • }
  •  Jung, Y.G., Park, J., Yoon, J., Peng, K.-C., Kim, W., Teoh, A.B.J., Camps, O., "TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S., Eds., DOI: 10.1109/​CVPR52734.2025.02378, June 2025, pp. 25539-25548.
    BibTeX TR2025-077 PDF Video Presentation
    • @inproceedings{Jung2025jun,
    • author = {Jung, Yoon G. and Park, Jaewoo and Yoon, Jaeho and Peng, Kuan-Chuan and Kim, Wonchul and Teoh, Andrew B. J. and Camps, Octavia},
    • title = {{TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2025,
    • editor = {Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S.},
    • pages = {25539--25548},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/CVPR52734.2025.02378},
    • issn = {2575-7075},
    • isbn = {979-8-3315-4364-8},
    • url = {https://www.merl.com/publications/TR2025-077}
    • }
  •  Masuyama, Y., Chang, X., Zhang, W., Cornell, S., Wang, Z.-Q., Ono, N., Qian, Y., Watanabe, S., "An End-to-End Integration of Speech Separation and Recognition with Self-Supervised Learning Representation", Computer Speech & Language, DOI: 10.1016/​j.csl.2025.101813, Vol. 95, pp. 101813, May 2025.
    BibTeX TR2025-054 PDF
    • @article{Masuyama2025may,
    • author = {Masuyama, Yoshiki and Chang, Xuankai and Zhang, Wangyou and Cornell, Samuele and Wang, Zhong-Qiu and Ono, Nobutaka and Qian, Yanmin and Watanabe, Shinji},
    • title = {{An End-to-End Integration of Speech Separation and Recognition with Self-Supervised Learning Representation}},
    • journal = {Computer Speech \& Language},
    • year = 2025,
    • volume = 95,
    • pages = 101813,
    • month = may,
    • doi = {10.1016/j.csl.2025.101813},
    • issn = {0885-2308},
    • url = {https://www.merl.com/publications/TR2025-054}
    • }
  •  Araki, S., Ito, N., Haeb-Umbach, R., Wichern, G., Wang, Z.-Q., Mitsufuji, Y., "30+ Years of Source Separation Research: Achievements and Future Challenges", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49660.2025.10889006, April 2025, pp. 1-5.
    BibTeX TR2025-036 PDF
    • @inproceedings{Araki2025mar,
    • author = {Araki, Shoko and Ito, Nobutaka and Haeb-Umbach, Reinhold and Wichern, Gordon and Wang, Zhong-Qiu and Mitsufuji, Yuki},
    • title = {{30+ Years of Source Separation Research: Achievements and Future Challenges}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • pages = {1--5},
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10889006},
    • url = {https://www.merl.com/publications/TR2025-036}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49660.2025.10887819, April 2025.
    BibTeX TR2025-032 PDF Software
    • @inproceedings{Saijo2025mar,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Task-Aware Unified Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10887819},
    • url = {https://www.merl.com/publications/TR2025-032}
    • }
  •  Vinod, A.P., Weiss, A., Di Cairano, S., "Inscribing and separating an ellipsoid and a constrained zonotope: Applications in stochastic control and centering", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/​CDC56724.2024.10886451, December 2024, pp. 8125-8131.
    BibTeX TR2024-173 PDF
    • @inproceedings{Vinod2024dec,
    • author = {Vinod, Abraham P. and Weiss, Avishai and {Di Cairano}, Stefano},
    • title = {{Inscribing and separating an ellipsoid and a constrained zonotope: Applications in stochastic control and centering}},
    • booktitle = {IEEE Conference on Decision and Control (CDC)},
    • year = 2024,
    • pages = {8125--8131},
    • month = dec,
    • doi = {10.1109/CDC56724.2024.10886451},
    • url = {https://www.merl.com/publications/TR2024-173}
    • }
  •  Cornell, S., Ebbers, J., Douwes, C., Martin-Morato, I., Harju, M., Mesaros, A., Serizel, R., "DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels", Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop, October 2024, pp. 31-35.
    BibTeX TR2024-146 PDF
    • @inproceedings{Cornell2024oct,
    • author = {Cornell, Samuele and Ebbers, Janek and Douwes, Constance and Martin-Morato, Irene and Harju, Manu and Mesaros, Annamaria and Serizel, Romain},
    • title = {{DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels}},
    • booktitle = {Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop},
    • year = 2024,
    • pages = {31--35},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2024-146}
    • }
  •  Saijo, K., Wichern, G., Germain, F.G., Pan, Z., Le Roux, J., "TF-Locoformer: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/​IWAENC61483.2024.10694313, September 2024, pp. 205-209.
    BibTeX TR2024-126 PDF Software
    • @inproceedings{Saijo2024sep2,
    • author = {Saijo, Kohei and Wichern, Gordon and Germain, François G. and Pan, Zexu and {Le Roux}, Jonathan},
    • title = {{TF-Locoformer: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement}},
    • booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
    • year = 2024,
    • pages = {205--209},
    • month = sep,
    • doi = {10.1109/IWAENC61483.2024.10694313},
    • issn = {2835-3439},
    • isbn = {979-8-3503-6185-8},
    • url = {https://www.merl.com/publications/TR2024-126}
    • }
  •  Pan, Z., Wichern, G., Germain, F.G., Saijo, K., Le Roux, J., "PARIS: Pseudo-AutoRegressIve Siamese Training for Online Speech Separation", Interspeech, DOI: 10.21437/​Interspeech.2024-1066, September 2024, pp. 582-586.
    BibTeX TR2024-124 PDF
    • @inproceedings{Pan2024sep,
    • author = {Pan, Zexu and Wichern, Gordon and Germain, François G. and Saijo, Kohei and {Le Roux}, Jonathan},
    • title = {{PARIS: Pseudo-AutoRegressIve Siamese Training for Online Speech Separation}},
    • booktitle = {Interspeech},
    • year = 2024,
    • pages = {582--586},
    • month = sep,
    • doi = {10.21437/Interspeech.2024-1066},
    • issn = {2958-1796},
    • url = {https://www.merl.com/publications/TR2024-124}
    • }
  •  Saijo, K., Wichern, G., Germain, F.G., Pan, Z., Le Roux, J., "Enhanced Reverberation as Supervision for Unsupervised Speech Separation", Interspeech, DOI: 10.21437/​Interspeech.2024-1241, September 2024, pp. 607-611.
    BibTeX TR2024-116 PDF Software
    • @inproceedings{Saijo2024sep,
    • author = {Saijo, Kohei and Wichern, Gordon and Germain, François G. and Pan, Zexu and {Le Roux}, Jonathan},
    • title = {{Enhanced Reverberation as Supervision for Unsupervised Speech Separation}},
    • booktitle = {Interspeech},
    • year = 2024,
    • pages = {607--611},
    • month = sep,
    • doi = {10.21437/Interspeech.2024-1241},
    • issn = {2958-1796},
    • url = {https://www.merl.com/publications/TR2024-116}
    • }
  •  Vinod, A.P., Yamazaki, S., Chakrabarty, A., Yoshikawa, N., Di Cairano, S., "Aircraft Approach Management using Reachability and Dynamic Programming", American Control Conference (ACC), DOI: 10.23919/​ACC60939.2024.10644902, June 2024, pp. 318-324.
    BibTeX TR2024-079 PDF
    • @inproceedings{Vinod2024jun,
    • author = {Vinod, Abraham P. and Yamazaki, Sachiyo and Chakrabarty, Ankush and Yoshikawa, Nobuyuki and {Di Cairano}, Stefano},
    • title = {{Aircraft Approach Management using Reachability and Dynamic Programming}},
    • booktitle = {American Control Conference (ACC)},
    • year = 2024,
    • pages = {318--324},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.23919/ACC60939.2024.10644902},
    • url = {https://www.merl.com/publications/TR2024-079}
    • }
  •  Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Why does music source separation benefit from cacophony?", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), DOI: 10.1109/​ICASSPW62465.2024.10669899, March 2024, pp. 873-877.
    BibTeX TR2024-030 PDF Video
    • @inproceedings{Jeon2024mar,
    • author = {Jeon, Chang-Bin and Wichern, Gordon and Germain, François G. and {Le Roux}, Jonathan},
    • title = {{Why does music source separation benefit from cacophony?}},
    • booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
    • year = 2024,
    • pages = {873--877},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSPW62465.2024.10669899},
    • isbn = {979-8-3503-7451-3},
    • url = {https://www.merl.com/publications/TR2024-030}
    • }
  •  Boeddeker, C., Subramanian, A.S., Wichern, G., Haeb-Umbach, R., Le Roux, J., "TS-SEP: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2024.3350887, Vol. 32, pp. 1185-1197, February 2024.
    BibTeX TR2024-006 PDF Software
    • @article{Boeddeker2024feb,
    • author = {Boeddeker, Christoph and Subramanian, Aswin Shanmugam and Wichern, Gordon and Haeb-Umbach, Reinhold and {Le Roux}, Jonathan},
    • title = {{TS-SEP: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings}},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2024,
    • volume = 32,
    • pages = {1185--1197},
    • month = feb,
    • doi = {10.1109/TASLP.2024.3350887},
    • issn = {2329-9304},
    • url = {https://www.merl.com/publications/TR2024-006}
    • }
  •  Pan, Z., Wichern, G., Masuyama, Y., Germain, F.G., Khurana, S., Hori, C., Le Roux, J., "Scenario-Aware Audio-Visual TF-GridNet for Target Speech Extraction", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/​ASRU57964.2023.10389618, December 2023.
    BibTeX TR2023-152 PDF Video
    • @inproceedings{Pan2023dec2,
    • author = {Pan, Zexu and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and Khurana, Sameer and Hori, Chiori and {Le Roux}, Jonathan},
    • title = {{Scenario-Aware Audio-Visual TF-GridNet for Target Speech Extraction}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2023,
    • month = dec,
    • doi = {10.1109/ASRU57964.2023.10389618},
    • isbn = {979-8-3503-0689-7},
    • url = {https://www.merl.com/publications/TR2023-152}
    • }
  •  Falcon Perez, R., Wichern, G., Germain, F., Le Roux, J., "Location as supervision for weakly supervised multi-channel source separation of machine sounds", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/​WASPAA58266.2023.10248128, September 2023.
    BibTeX TR2023-119 PDF Presentation
    • @inproceedings{FalconPerez2023aug,
    • author = {Falcon Perez, Ricardo and Wichern, Gordon and Germain, Francois and {Le Roux}, Jonathan},
    • title = {{Location as supervision for weakly supervised multi-channel source separation of machine sounds}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2023,
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/WASPAA58266.2023.10248128},
    • issn = {1947-1629},
    • isbn = {979-8-3503-2372-6},
    • url = {https://www.merl.com/publications/TR2023-119}
    • }
  •  Petermann, D., Wichern, G., Subramanian, A.S., Wang, Z.-Q., Le Roux, J., "Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2023.3290428, Vol. 31, pp. 2592-2605, September 2023.
    BibTeX TR2023-113 PDF
    • @article{Petermann2023sep,
    • author = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Wang, Zhong-Qiu and {Le Roux}, Jonathan},
    • title = {{Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks}},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2023,
    • volume = 31,
    • pages = {2592--2605},
    • month = sep,
    • doi = {10.1109/TASLP.2023.3290428},
    • issn = {2329-9304},
    • url = {https://www.merl.com/publications/TR2023-113}
    • }
  •  Vinod, A.P., Di Cairano, S., "Sample quantile-based programming for non-convex separable chance constraints", American Control Conference (ACC), May 2023, pp. 1517-1522.
    BibTeX TR2023-062 PDF
    • @inproceedings{Vinod2023may,
    • author = {Vinod, Abraham P. and {Di Cairano}, Stefano},
    • title = {{Sample quantile-based programming for non-convex separable chance constraints}},
    • booktitle = {American Control Conference (ACC)},
    • year = 2023,
    • pages = {1517--1522},
    • month = may,
    • url = {https://www.merl.com/publications/TR2023-062}
    • }
  •  Chen, K., Wichern, G., Germain, F., Le Roux, J., "Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT", IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB), DOI: 10.1109/​ICASSPW59220.2023.10193575, May 2023.
    BibTeX TR2023-030 PDF
    • @inproceedings{Chen2023may,
    • author = {Chen, Ke and Wichern, Gordon and Germain, Francois and {Le Roux}, Jonathan},
    • title = {{Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT}},
    • booktitle = {IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB)},
    • year = 2023,
    • month = may,
    • doi = {10.1109/ICASSPW59220.2023.10193575},
    • isbn = {979-8-3503-0261-5},
    • url = {https://www.merl.com/publications/TR2023-030}
    • }
  •  Aralikatti, R., Boeddeker, C., Wichern, G., Subramanian, A.S., Le Roux, J., "Reverberation as Supervision for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095022, May 2023, pp. 1-5.
    BibTeX TR2023-016 PDF
    • @inproceedings{Aralikatti2023may,
    • author = {Aralikatti, Rohith and Boeddeker, Christoph and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
    • title = {{Reverberation as Supervision for Speech Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095022},
    • url = {https://www.merl.com/publications/TR2023-016}
    • }