Publications

Manilow, E., Wichern, G., Le Roux, J., "Hierarchical Musical Instrument Separation", International Society for Music Information Retrieval (ISMIR) Conference, October 2020, pp. 376-383.
BibTeX TR2020-136 PDF Software
- @inproceedings{Manilow2020oct,
- author = {Manilow, Ethan and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Hierarchical Musical Instrument Separation}},
- booktitle = {International Society for Music Information Retrieval (ISMIR) Conference},
- year = 2020,
- pages = {376--383},
- month = oct,
- isbn = {978-0-9813537-0-8},
- url = {https://www.merl.com/publications/TR2020-136}
- }
Seetharaman, P., Wichern, G., Pardo, B., Le Roux, J., "Autoclip: Adaptive Gradient Clipping For Source Separation Networks", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/MLSP49062.2020.9231926, September 2020.
BibTeX TR2020-132 PDF
- @inproceedings{Seetharaman2020sep,
- author = {Seetharaman, Prem and Wichern, Gordon and Pardo, Bryan and {Le Roux}, Jonathan},
- title = {{Autoclip: Adaptive Gradient Clipping For Source Separation Networks}},
- booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
- year = 2020,
- month = sep,
- publisher = {IEEE},
- doi = {10.1109/MLSP49062.2020.9231926},
- url = {https://www.merl.com/publications/TR2020-132}
- }
Pishdadian, F., Wichern, G., Le Roux, J., "Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2020.3013105, Vol. 28, pp. 2386-2399, September 2020.
BibTeX TR2020-126 PDF
- @article{Pishdadian2020sep,
- author = {Pishdadian, Fatemeh and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision}},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2020,
- volume = 28,
- pages = {2386--2399},
- month = sep,
- doi = {10.1109/TASLP.2020.3013105},
- url = {https://www.merl.com/publications/TR2020-126}
- }
Di Cairano, S., Danielson, C., "Indirect Adaptive Model Predictive Control and its Application to Uncertain Linear Systems", International Journal of Robust and Nonlinear Control, DOI: 10.1002/rnc.5166, July 2020.
BibTeX TR2020-115 PDF
- @article{DiCairano2020jul,
- author = {{Di Cairano}, Stefano and Danielson, Claus},
- title = {{Indirect Adaptive Model Predictive Control and its Application to Uncertain Linear Systems}},
- journal = {International Journal of Robust and Nonlinear Control},
- year = 2020,
- month = jul,
- doi = {10.1002/rnc.5166},
- url = {https://www.merl.com/publications/TR2020-115}
- }
Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles", ICML 2020 Workshop on Self-supervision in Audio and Speech, July 2020.
BibTeX TR2020-111 PDF
- @inproceedings{Seetharaman2020jul,
- author = {Seetharaman, Prem and Wichern, Gordon and {Le Roux}, Jonathan and Pardo, Bryan},
- title = {{Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles}},
- booktitle = {ICML 2020 Workshop on Self-supervision in Audio and Speech},
- year = 2020,
- month = jul,
- url = {https://www.merl.com/publications/TR2020-111}
- }
Konno, N., Raghunathan, A., "Data-Driven Joint Optimization of Pricing and Seat Allocation in Trains", International Conference on Railway Engineering Design and Operation (COMPRAIL), DOI: 10.2495/CR200351, July 2020, pp. 379-392.
BibTeX TR2020-094 PDF
- @inproceedings{Konno2020jul2,
- author = {Konno, Naoto and Raghunathan, Arvind},
- title = {{Data-Driven Joint Optimization of Pricing and Seat Allocation in Trains}},
- booktitle = {International Conference on Railway Engineering Design and Operation (COMPRAIL)},
- year = 2020,
- pages = {379--392},
- month = jul,
- publisher = {WIT Press},
- doi = {10.2495/CR200351},
- url = {https://www.merl.com/publications/TR2020-094}
- }
Sun, H., Wang, P., Pajovic, M., Koike-Akino, T., Orlik, P.V., Taira, A., Nakagawa, K., "Fingerprinting-Based Outdoor Localization with 28-GHz Channel Measurement: A Field Study", IEEE International Workshop on Signal Processing Advances in Wireless Communications (SPAWC), DOI: 10.1109/SPAWC48557.2020.9154212, May 2020.
BibTeX TR2020-056 PDF
- @inproceedings{Sun2020may,
- author = {Sun, Haijian and Wang, Pu and Pajovic, Milutin and Koike-Akino, Toshiaki and Orlik, Philip V. and Taira, Akinori and Nakagawa, Kenji},
- title = {{Fingerprinting-Based Outdoor Localization with 28-GHz Channel Measurement: A Field Study}},
- booktitle = {IEEE International Workshop on Signal Processing Advances in Wireless Communications (SPAWC)},
- year = 2020,
- month = may,
- publisher = {IEEE},
- doi = {10.1109/SPAWC48557.2020.9154212},
- issn = {1948-3252},
- isbn = {978-1-7281-5478-7},
- url = {https://www.merl.com/publications/TR2020-056}
- }
Pishdadian, F., Wichern, G., Le Roux, J., "Learning to Separate Sounds From Weakly Labeled Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053055, April 2020, pp. 91-95.
BibTeX TR2020-038 PDF Video Presentation
- @inproceedings{Pishdadian2020apr,
- author = {Pishdadian, Fatemeh and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Learning to Separate Sounds From Weakly Labeled Scenes}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {91--95},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053055},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-038}
- }
Maciejewski, M., Wichern, G., McQuinn, E., Le Roux, J., "WHAMR!: Noisy and Reverberant Single-Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053327, April 2020, pp. 696-700.
BibTeX TR2020-042 PDF Video Presentation
- @inproceedings{Maciejewski2020apr,
- author = {Maciejewski, Matthew and Wichern, Gordon and McQuinn, Emmett and {Le Roux}, Jonathan},
- title = {{WHAMR!: Noisy and Reverberant Single-Channel Speech Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {696--700},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053327},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-042}
- }
Wang, P., Boufounos, P.T., Mansour, H., Orlik, P.V., "Slow-Time MIMO-FMCW Automotive Radar Detection with Imperfect Waveform Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053892, April 2020, pp. 8634-8638.
BibTeX TR2020-039 PDF Video
- @inproceedings{Wang2020apr,
- author = {Wang, Pu and Boufounos, Petros T. and Mansour, Hassan and Orlik, Philip V.},
- title = {{Slow-Time MIMO-FMCW Automotive Radar Detection with Imperfect Waveform Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {8634--8638},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053892},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-039}
- }
Li, R., Wang, X., Mallidi, H., Watanabe, S., Hori, T., Hermansky, H., "Multi-Stream End-to-End Speech Recognition", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2019.2959721, Vol. 28, pp. 646-655, March 2020.
BibTeX TR2020-030 PDF
- @article{Li2020mar,
- author = {Li, Ruizhi and Wang, Xiaofei and Mallidi, Harish and Watanabe, Shinji and Hori, Takaaki and Hermansky, Hynek},
- title = {{Multi-Stream End-to-End Speech Recognition}},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2020,
- volume = 28,
- pages = {646--655},
- month = mar,
- doi = {10.1109/TASLP.2019.2959721},
- url = {https://www.merl.com/publications/TR2020-030}
- }
Aihara, R., Wichern, G., Le Roux, J., "Deep Clustering-based Single Channel Speech Separation and Recent Advances", Acoustical Science and Technology, DOI: 10.1250/ast.41.465, Vol. 41, No. 2, pp. 465-471, March 2020.
BibTeX TR2021-020 PDF
- @article{Aihara2020jun,
- author = {Aihara, Ryo and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Deep Clustering-based Single Channel Speech Separation and Recent Advances}},
- journal = {Acoustical Science and Technology},
- year = 2020,
- volume = 41,
- number = 2,
- pages = {465--471},
- month = mar,
- doi = {10.1250/ast.41.465},
- url = {https://www.merl.com/publications/TR2021-020}
- }
Wang, P., Li, H., "Target Detection with Imperfect Waveform Separation in Distributed MIMO Radar", IEEE Transactions on Signal Processing, DOI: 10.1109/TSP.2020.2964227, Vol. 68, No. 1, pp. 793-807, January 2020.
BibTeX TR2020-007 PDF
- @article{Wang2020jan,
- author = {Wang, Pu and Li, Hongbin},
- title = {{Target Detection with Imperfect Waveform Separation in Distributed MIMO Radar}},
- journal = {IEEE Transactions on Signal Processing},
- year = 2020,
- volume = 68,
- number = 1,
- pages = {793--807},
- month = jan,
- doi = {10.1109/TSP.2020.2964227},
- issn = {1053-587X},
- url = {https://www.merl.com/publications/TR2020-007}
- }
Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2019, pp. 237-244.
BibTeX TR2019-157 PDF
- @inproceedings{Chang2019dec,
- author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and {Le Roux}, Jonathan and Watanabe, Shinji},
- title = {{MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2019,
- pages = {237--244},
- month = dec,
- isbn = {978-1-7281-0305-1},
- url = {https://www.merl.com/publications/TR2019-157}
- }
Wollenstein, S., Sun, C., Zhang, J., Paschalidis, I., "Joint Estimation of OD Demands and Cost Functions in Transportation Networks from Data", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/CDC40024.2019.9029445, December 2019, pp. 5113-5118.
BibTeX TR2019-144 PDF
- @inproceedings{Wollenstein2019dec,
- author = {Wollenstein, Salom{\'o}n and Sun, Chuangchuang and Zhang, Jing and Paschalidis, Ioannis},
- title = {{Joint Estimation of OD Demands and Cost Functions in Transportation Networks from Data}},
- booktitle = {IEEE Conference on Decision and Control (CDC)},
- year = 2019,
- pages = {5113--5118},
- month = dec,
- doi = {10.1109/CDC40024.2019.9029445},
- url = {https://www.merl.com/publications/TR2019-144}
- }
Jespersen, M.H., Pajovic, M., Koike-Akino, T., Wang, Y., Popovski, P., Orlik, P.V., "Deep Learning for Synchronization and Channel Estimation in NB-IoT Random Access Channel", IEEE Global Communications Conference (GLOBECOM), DOI: 10.1109/GLOBECOM38437.2019.9013510, December 2019.
BibTeX TR2019-140 PDF
- @inproceedings{Jespersen2019dec,
- author = {Jespersen, Mads Helge and Pajovic, Milutin and Koike-Akino, Toshiaki and Wang, Ye and Popovski, Petar and Orlik, Philip V.},
- title = {{Deep Learning for Synchronization and Channel Estimation in NB-IoT Random Access Channel}},
- booktitle = {IEEE Global Communications Conference (GLOBECOM)},
- year = 2019,
- month = dec,
- publisher = {IEEE},
- doi = {10.1109/GLOBECOM38437.2019.9013510},
- issn = {2576-6813},
- isbn = {978-1-7281-0962-6},
- url = {https://www.merl.com/publications/TR2019-140}
- }
Kavalerov, I., Wisdom, S., Erdogan, H., Patton, B., Wilson, K., Le Roux, J., Hershey, J., "Universal Sound Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2019.8937253, October 2019, pp. 170-174.
BibTeX TR2019-123 PDF
- @inproceedings{Kavalerov2019oct,
- author = {Kavalerov, Ilya and Wisdom, Scott and Erdogan, Hakan and Patton, Brian and Wilson, Kevin and {Le Roux}, Jonathan and Hershey, John},
- title = {{Universal Sound Separation}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2019,
- pages = {170--174},
- month = oct,
- doi = {10.1109/WASPAA.2019.8937253},
- issn = {1947-1629},
- isbn = {978-1-7281-1123-0},
- url = {https://www.merl.com/publications/TR2019-123}
- }
Manilow, E., Wichern, G., Seetharaman, P., Le Roux, J., "Cutting Music Source Separation Some Slakh: A Dataset to Study the Impact of Training Data Quality and Quantity", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2019.8937170, October 2019, pp. 45-49.
BibTeX TR2019-124 PDF
- @inproceedings{Manilow2019oct,
- author = {Manilow, Ethan and Wichern, Gordon and Seetharaman, Prem and {Le Roux}, Jonathan},
- title = {{Cutting Music Source Separation Some Slakh: A Dataset to Study the Impact of Training Data Quality and Quantity}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2019,
- pages = {45--49},
- month = oct,
- doi = {10.1109/WASPAA.2019.8937170},
- issn = {1947-1629},
- isbn = {978-1-7281-1123-0},
- url = {https://www.merl.com/publications/TR2019-124}
- }
Karafiat, M., Baskar, M.K., Watanabe, S., Hori, T., Wiesner, M., Cernocky, J.H., "Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems", Interspeech, DOI: 10.21437/Interspeech.2019-2355, September 2019, pp. 2220-2224.
BibTeX TR2019-103 PDF
- @inproceedings{Karafiat2019sep,
- author = {Karafiat, Martin and Baskar, Murali Karthick and Watanabe, Shinji and Hori, Takaaki and Wiesner, Matthew and Cernocky, Jan Honza},
- title = {{Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems}},
- booktitle = {Interspeech},
- year = 2019,
- pages = {2220--2224},
- month = sep,
- doi = {10.21437/Interspeech.2019-2355},
- url = {https://www.merl.com/publications/TR2019-103}
- }
Wichern, G., McQuinn, E., Antognini, J., Flynn, M., Zhu, R., Crow, D., Manilow, E., Le Roux, J., "WHAM!: Extending Speech Separation to Noisy Environments", Interspeech, DOI: 10.21437/Interspeech.2019-2821, September 2019, pp. 1368-1372.
BibTeX TR2019-099 PDF
- @inproceedings{Wichern2019sep,
- author = {Wichern, Gordon and McQuinn, Emmett and Antognini, Joe and Flynn, Michael and Zhu, Richard and Crow, Dwight and Manilow, Ethan and {Le Roux}, Jonathan},
- title = {{WHAM!: Extending Speech Separation to Noisy Environments}},
- booktitle = {Interspeech},
- year = 2019,
- pages = {1368--1372},
- month = sep,
- doi = {10.21437/Interspeech.2019-2821},
- url = {https://www.merl.com/publications/TR2019-099}
- }
Wang, J., Cherian, A., "Discriminative Video Representation Learning Using Support Vector Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2019.2937292, August 2019.
BibTeX TR2019-107 PDF
- @article{Wang2019aug,
- author = {Wang, Jue and Cherian, Anoop},
- title = {{Discriminative Video Representation Learning Using Support Vector Classifiers}},
- journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
- year = 2019,
- month = aug,
- doi = {10.1109/TPAMI.2019.2937292},
- url = {https://www.merl.com/publications/TR2019-107}
- }
Aihara, R., Hanazawa, T., Okato, Y., Wichern, G., Le Roux, J., "Teacher-Student Deep Clustering For Low-Delay Single Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682695, May 2019.
BibTeX TR2019-003 PDF
- @inproceedings{Aihara2019may,
- author = {Aihara, Ryo and Hanazawa, Toshiyuki and Okato, Yohei and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Teacher-Student Deep Clustering For Low-Delay Single Channel Speech Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8682695},
- url = {https://www.merl.com/publications/TR2019-003}
- }
Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "The Phasebook: Building Complex Masks via Discrete Representations for Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682587, May 2019.
BibTeX TR2019-008 PDF
- @inproceedings{LeRoux2019may2,
- author = {{Le Roux}, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
- title = {{The Phasebook: Building Complex Masks via Discrete Representations for Source Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8682587},
- url = {https://www.merl.com/publications/TR2019-008}
- }
Le Roux, J., Wisdom, S., Erdogan, H., Hershey, J., "SDR -- Half-Baked or Well Done?", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683855, May 2019.
BibTeX TR2019-013 PDF
- @inproceedings{LeRoux2019may,
- author = {{Le Roux}, Jonathan and Wisdom, Scott and Erdogan, Hakan and Hershey, John},
- title = {{SDR -- Half-Baked or Well Done?}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8683855},
- url = {https://www.merl.com/publications/TR2019-013}
- }
Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683198, May 2019.
BibTeX TR2019-014 PDF
- @inproceedings{Seetharaman2019may2,
- author = {Seetharaman, Prem and Wichern, Gordon and {Le Roux}, Jonathan and Pardo, Bryan},
- title = {{Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8683198},
- url = {https://www.merl.com/publications/TR2019-014}
- }