Publications

Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Why does music source separation benefit from cacophony?", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), March 2024.
BibTeX TR2024-030 PDF Video
- @inproceedings{Jeon2024mar,
-   author    = {Jeon, Chang-Bin and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Le Roux, Jonathan},
-   title     = {Why does music source separation benefit from cacophony?},
-   booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
-   year      = {2024},
-   month     = mar,
-   url       = {https://www.merl.com/publications/TR2024-030},
- }
Boeddeker, C., Subramanian, A.S., Wichern, G., Haeb-Umbach, R., Le Roux, J., "TS-SEP: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2024.3350887, Vol. 32, pp. 1185-1197, February 2024.
BibTeX TR2024-006 PDF
- @article{Boeddeker2024feb,
-   author  = {Boeddeker, Christoph and Subramanian, Aswin Shanmugam and Wichern, Gordon and Haeb-Umbach, Reinhold and Le Roux, Jonathan},
-   title   = {{TS-SEP}: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings},
-   journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
-   volume  = {32},
-   pages   = {1185--1197},
-   year    = {2024},
-   month   = feb,
-   doi     = {10.1109/TASLP.2024.3350887},
-   issn    = {2329-9304},
-   url     = {https://www.merl.com/publications/TR2024-006},
- }
Pan, Z., Wichern, G., Masuyama, Y., Germain, F.G., Khurana, S., Hori, C., Le Roux, J., "Scenario-Aware Audio-Visual TF-GridNet for Target Speech Extraction", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU57964.2023.10389618, December 2023.
BibTeX TR2023-152 PDF
- @inproceedings{Pan2023dec2,
-   author    = {Pan, Zexu and Wichern, Gordon and Masuyama, Yoshiki and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Hori, Chiori and Le Roux, Jonathan},
-   title     = {Scenario-Aware Audio-Visual {TF-GridNet} for Target Speech Extraction},
-   booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
-   year      = {2023},
-   month     = dec,
-   doi       = {10.1109/ASRU57964.2023.10389618},
-   isbn      = {979-8-3503-0689-7},
-   url       = {https://www.merl.com/publications/TR2023-152},
- }
Falcon Perez, R., Wichern, G., Germain, F., Le Roux, J., "Location as supervision for weakly supervised multi-channel source separation of machine sounds", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA58266.2023.10248128, September 2023.
BibTeX TR2023-119 PDF Presentation
- @inproceedings{FalconPerez2023aug,
-   author    = {Falcon Perez, Ricardo and Wichern, Gordon and Germain, Francois and Le Roux, Jonathan},
-   title     = {Location as supervision for weakly supervised multi-channel source separation of machine sounds},
-   booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
-   year      = {2023},
-   month     = sep,
-   publisher = {IEEE},
-   doi       = {10.1109/WASPAA58266.2023.10248128},
-   issn      = {1947-1629},
-   isbn      = {979-8-3503-2372-6},
-   url       = {https://www.merl.com/publications/TR2023-119},
- }
Petermann, D., Wichern, G., Subramanian, A.S., Wang, Z.-Q., Le Roux, J., "Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2023.3290428, Vol. 31, pp. 2592-2605, September 2023.
BibTeX TR2023-113 PDF
- @article{Petermann2023sep,
-   author  = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Wang, Zhong-Qiu and Le Roux, Jonathan},
-   title   = {Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks},
-   journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
-   volume  = {31},
-   pages   = {2592--2605},
-   year    = {2023},
-   month   = sep,
-   doi     = {10.1109/TASLP.2023.3290428},
-   issn    = {2329-9304},
-   url     = {https://www.merl.com/publications/TR2023-113},
- }
Vinod, A.P., Di Cairano, S., "Sample quantile-based programming for non-convex separable chance constraints", American Control Conference (ACC), May 2023, pp. 1517-1522.
BibTeX TR2023-062 PDF
- @inproceedings{Vinod2023may,
-   author    = {Vinod, Abraham P. and Di Cairano, Stefano},
-   title     = {Sample quantile-based programming for non-convex separable chance constraints},
-   booktitle = {American Control Conference (ACC)},
-   pages     = {1517--1522},
-   year      = {2023},
-   month     = may,
-   url       = {https://www.merl.com/publications/TR2023-062},
- }
Chen, K., Wichern, G., Germain, F., Le Roux, J., "Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT", IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB), DOI: 10.1109/ICASSPW59220.2023.10193575, May 2023.
BibTeX TR2023-030 PDF
- @inproceedings{Chen2023may,
-   author    = {Chen, Ke and Wichern, Gordon and Germain, Francois and Le Roux, Jonathan},
-   title     = {{Pac-HuBERT}: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit {BERT}},
-   booktitle = {IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB)},
-   year      = {2023},
-   month     = may,
-   doi       = {10.1109/ICASSPW59220.2023.10193575},
-   isbn      = {979-8-3503-0261-5},
-   url       = {https://www.merl.com/publications/TR2023-030},
- }
Aralikatti, R., Boeddeker, C., Wichern, G., Subramanian, A.S., Le Roux, J., "Reverberation as Supervision for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095022, May 2023, pp. 1-5.
BibTeX TR2023-016 PDF
- @inproceedings{Aralikatti2023may,
-   author    = {Aralikatti, Rohith and Boeddeker, Christoph and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
-   title     = {Reverberation as Supervision for Speech Separation},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {1--5},
-   year      = {2023},
-   month     = may,
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP49357.2023.10095022},
-   url       = {https://www.merl.com/publications/TR2023-016},
- }
Bralios, D., Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Latent Iterative Refinement for Modular Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10096897, May 2023, pp. 1-5.
BibTeX TR2023-019 PDF
- @inproceedings{Bralios2023may,
-   author    = {Bralios, Dimitrios and Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and Le Roux, Jonathan},
-   title     = {Latent Iterative Refinement for Modular Source Separation},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {1--5},
-   year      = {2023},
-   month     = may,
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP49357.2023.10096897},
-   url       = {https://www.merl.com/publications/TR2023-019},
- }
Petermann, D., Wichern, G., Subramanian, A.S., Le Roux, J., "Hyperbolic Audio Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10094943, May 2023, pp. 1-5.
BibTeX TR2023-017 PDF Software
- @inproceedings{Petermann2023may,
-   author    = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
-   title     = {Hyperbolic Audio Source Separation},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {1--5},
-   year      = {2023},
-   month     = may,
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP49357.2023.10094943},
-   url       = {https://www.merl.com/publications/TR2023-017},
- }
Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Optimal Condition Training for Target Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095128, May 2023, pp. 1-5.
BibTeX TR2023-018 PDF
- @inproceedings{Tzinis2023may,
-   author    = {Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and Le Roux, Jonathan},
-   title     = {Optimal Condition Training for Target Source Separation},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {1--5},
-   year      = {2023},
-   month     = may,
-   publisher = {IEEE},
-   doi       = {10.1109/ICASSP49357.2023.10095128},
-   url       = {https://www.merl.com/publications/TR2023-018},
- }
Lin, C., "Analytical Parametrization for Magnetization of Gadolinium based on Scaling Hypothesis", Physica A, DOI: 10.1016/j.physa.2023.128686, Vol. 617, pp. 128686, April 2023.
BibTeX TR2023-015 PDF
- @article{Lin2023apr,
-   author  = {Lin, Chungwei},
-   title   = {Analytical Parametrization for Magnetization of Gadolinium based on Scaling Hypothesis},
-   journal = {Physica A},
-   volume  = {617},
-   pages   = {128686},
-   year    = {2023},
-   month   = apr,
-   doi     = {10.1016/j.physa.2023.128686},
-   issn    = {0378-4371},
-   url     = {https://www.merl.com/publications/TR2023-015},
- }
Chatterjee, M., Ahuja, N., Cherian, A., "Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation", Advances in Neural Information Processing Systems (NeurIPS), November 2022.
BibTeX TR2022-140 PDF Presentation
- @inproceedings{Chatterjee2022nov,
-   author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
-   title     = {Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation},
-   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
-   year      = {2022},
-   month     = nov,
-   url       = {https://www.merl.com/publications/TR2022-140},
- }
Tzinis, E., Wichern, G., Subramanian, A.S., Smaragdis, P., Le Roux, J., "Heterogeneous Target Speech Separation", Interspeech, DOI: 10.21437/Interspeech.2022-10717, September 2022, pp. 1796-1800.
BibTeX TR2022-115 PDF Video Presentation
- @inproceedings{Tzinis2022sep,
-   author    = {Tzinis, Efthymios and Wichern, Gordon and Subramanian, Aswin Shanmugam and Smaragdis, Paris and Le Roux, Jonathan},
-   title     = {Heterogeneous Target Speech Separation},
-   booktitle = {Interspeech},
-   pages     = {1796--1800},
-   year      = {2022},
-   month     = sep,
-   doi       = {10.21437/Interspeech.2022-10717},
-   url       = {https://www.merl.com/publications/TR2022-115},
- }
Yu, J., Wang, P., Koike-Akino, T., Wang, Y., Orlik, P.V., Buehrer, R.M., "Multi-Band Wi-Fi Sensing with Matched Feature Granularity", IEEE Internet of Things Journal, DOI: 10.1109/JIOT.2022.3190826, July 2022.
BibTeX TR2022-105 PDF
- @article{Yu2022jul,
-   author  = {Yu, Jianyuan and Wang, Pu and Koike-Akino, Toshiaki and Wang, Ye and Orlik, Philip V. and Buehrer, R. Michael},
-   title   = {Multi-Band {Wi-Fi} Sensing with Matched Feature Granularity},
-   journal = {IEEE Internet of Things Journal},
-   year    = {2022},
-   month   = jul,
-   doi     = {10.1109/JIOT.2022.3190826},
-   issn    = {2327-4662},
-   url     = {https://www.merl.com/publications/TR2022-105},
- }
Shirsat, A., Sun, H., Kim, K.J., Guo, J., Nikovski, D.N., "ConvEDNet: A Convolutional Energy Disaggregation Network Using Continuous Point-On-Wave Measurements", IEEE PES General Meeting, DOI: 10.1109/PESGM48719.2022.9916802, July 2022.
BibTeX TR2022-101 PDF
- @inproceedings{Shirsat2022jul,
-   author    = {Shirsat, Ashwin and Sun, Hongbo and Kim, Kyeong Jin and Guo, Jianlin and Nikovski, Daniel N.},
-   title     = {{ConvEDNet}: A Convolutional Energy Disaggregation Network Using Continuous Point-On-Wave Measurements},
-   booktitle = {2022 IEEE Power \& Energy Society General Meeting (PESGM)},
-   year      = {2022},
-   month     = jul,
-   doi       = {10.1109/PESGM48719.2022.9916802},
-   url       = {https://www.merl.com/publications/TR2022-101},
- }
Wollenstein-Betech, S., Sun, C., Zhang, J., Cassandras, C.G., Paschalidis, I.C., "Joint Data-Driven Estimation of Origin-Destination Demand and Travel Latency Functions in Multi-Class Transportation Networks", IEEE Transactions on Control of Network Systems, DOI: 10.1109/TCNS.2022.3161200, June 2022.
BibTeX TR2022-078 PDF
- @article{Wollenstein-Betech2022jun,
-   author  = {Wollenstein-Betech, Salomon and Sun, Chuangchuang and Zhang, Jing and Cassandras, Christos G. and Paschalidis, Ioannis Ch.},
-   title   = {Joint Data-Driven Estimation of Origin-Destination Demand and Travel Latency Functions in Multi-Class Transportation Networks},
-   journal = {IEEE Transactions on Control of Network Systems},
-   year    = {2022},
-   month   = jun,
-   doi     = {10.1109/TCNS.2022.3161200},
-   url     = {https://www.merl.com/publications/TR2022-078},
- }
Petermann, D., Wichern, G., Wang, Z.-Q., Le Roux, J., "The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP43922.2022.9746005, April 2022, pp. 526-530.
BibTeX TR2022-022 PDF Software
- @inproceedings{Petermann2022apr,
-   author    = {Petermann, Darius and Wichern, Gordon and Wang, Zhong-Qiu and Le Roux, Jonathan},
-   title     = {The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {526--530},
-   year      = {2022},
-   month     = apr,
-   doi       = {10.1109/ICASSP43922.2022.9746005},
-   url       = {https://www.merl.com/publications/TR2022-022},
- }
Jin, S., Pu, W., Boufounos, P.T., Orlik, P.V., Roy, S., "Automotive Radar Interference Mitigation with Fast-Time-Frequency Mode Retrieval", IEEE Radar Conference (RadarCon), DOI: 10.1109/RadarConf2248738.2022.9764338, March 2022.
BibTeX TR2022-029 PDF
- @inproceedings{Jin2022mar,
-   author    = {Jin, Sian and Pu, Wang and Boufounos, Petros T. and Orlik, Philip V. and Roy, Sumit},
-   title     = {Automotive Radar Interference Mitigation with Fast-Time-Frequency Mode Retrieval},
-   booktitle = {IEEE Radar Conference (RadarCon)},
-   year      = {2022},
-   month     = mar,
-   doi       = {10.1109/RadarConf2248738.2022.9764338},
-   isbn      = {978-1-7281-5368-1},
-   url       = {https://www.merl.com/publications/TR2022-029},
- }
Nohra, C.J., Raghunathan, A., Sahinidis, N.V., "SDP-quality bounds via convex quadratic relaxations for global optimization of mixed-integer quadratic programs", Mathematical Programming B, DOI: 10.1007/s10107-021-01680-9, Vol. 196, No. 1-2, pp. 203–233, December 2021.
BibTeX TR2022-001 PDF
- @article{Nohra2021dec,
-   author  = {Nohra, Carlos J. and Raghunathan, Arvind and Sahinidis, Nikolaos V.},
-   title   = {{SDP}-quality bounds via convex quadratic relaxations for global optimization of mixed-integer quadratic programs},
-   journal = {Mathematical Programming B},
-   volume  = {196},
-   number  = {1-2},
-   pages   = {203--233},
-   year    = {2021},
-   month   = dec,
-   doi     = {10.1007/s10107-021-01680-9},
-   url     = {https://www.merl.com/publications/TR2022-001},
- }
Bonzanini, A.D., Mesbah, A., Di Cairano, S., "On the Stability Properties of Perception-aware Chance-constrained MPC in Uncertain Environments", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/CDC45484.2021.9682990, December 2021.
BibTeX TR2021-145 PDF
- @inproceedings{Bonzanini2021dec,
-   author    = {Bonzanini, Angelo Domenico and Mesbah, Ali and Di Cairano, Stefano},
-   title     = {On the Stability Properties of Perception-aware Chance-constrained {MPC} in Uncertain Environments},
-   booktitle = {IEEE Conference on Decision and Control (CDC)},
-   year      = {2021},
-   month     = dec,
-   doi       = {10.1109/CDC45484.2021.9682990},
-   url       = {https://www.merl.com/publications/TR2021-145},
- }
Wang, Z.-Q., Wichern, G., Le Roux, J., "Convolutive Prediction for Monaural Speech Dereverberation and Noisy-Reverberant Speaker Separation", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2021.3129363, Vol. 29, pp. 3476-3490, December 2021.
BibTeX TR2021-144 PDF
- @article{Wang2021dec,
-   author  = {Wang, Zhong-Qiu and Wichern, Gordon and Le Roux, Jonathan},
-   title   = {Convolutive Prediction for Monaural Speech Dereverberation and Noisy-Reverberant Speaker Separation},
-   journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
-   volume  = {29},
-   pages   = {3476--3490},
-   year    = {2021},
-   month   = dec,
-   doi     = {10.1109/TASLP.2021.3129363},
-   url     = {https://www.merl.com/publications/TR2021-144},
- }
Wang, Z.-Q., Wichern, G., Le Roux, J., "On The Compensation Between Magnitude and Phase in Speech Separation", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2021.3116502, Vol. 28, pp. 2018-2022, November 2021.
BibTeX TR2021-137 PDF
- @article{Wang2021nov2,
-   author  = {Wang, Zhong-Qiu and Wichern, Gordon and Le Roux, Jonathan},
-   title   = {On The Compensation Between Magnitude and Phase in Speech Separation},
-   journal = {IEEE Signal Processing Letters},
-   volume  = {28},
-   pages   = {2018--2022},
-   year    = {2021},
-   month   = nov,
-   doi     = {10.1109/LSP.2021.3116502},
-   url     = {https://www.merl.com/publications/TR2021-137},
- }
Wang, Z.-Q., Wichern, G., Le Roux, J., "Convolutive Prediction for Reverberant Speech Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA52581.2021.9632667, October 2021, pp. 56-60.
BibTeX TR2021-127 PDF
- @inproceedings{Wang2021oct4,
-   author    = {Wang, Zhong-Qiu and Wichern, Gordon and Le Roux, Jonathan},
-   title     = {Convolutive Prediction for Reverberant Speech Separation},
-   booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
-   pages     = {56--60},
-   year      = {2021},
-   month     = oct,
-   publisher = {IEEE},
-   doi       = {10.1109/WASPAA52581.2021.9632667},
-   url       = {https://www.merl.com/publications/TR2021-127},
- }
Chatterjee, M., Le Roux, J., Ahuja, N., Cherian, A., "Visual Scene Graphs for Audio Source Separation", IEEE International Conference on Computer Vision (ICCV), October 2021, pp. 1204-1213.
BibTeX TR2021-095 PDF Video Software
- @inproceedings{Chatterjee2021oct,
-   author    = {Chatterjee, Moitreya and Le Roux, Jonathan and Ahuja, Narendra and Cherian, Anoop},
-   title     = {Visual Scene Graphs for Audio Source Separation},
-   booktitle = {IEEE International Conference on Computer Vision (ICCV)},
-   pages     = {1204--1213},
-   year      = {2021},
-   month     = oct,
-   publisher = {CVF},
-   url       = {https://www.merl.com/publications/TR2021-095},
- }