- Kavalerov, I., Wisdom, S., Erdogan, H., Patton, B., Wilson, K., Le Roux, J., Hershey, J., "Universal Sound Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2019.8937253, October 2019, pp. 170-174.
BibTeX TR2019-123 PDF- @inproceedings{Kavalerov2019oct,
- author = {Kavalerov, Ilya and Wisdom, Scott and Erdogan, Hakan and Patton, Brian and Wilson, Kevin and Le Roux, Jonathan and Hershey, John},
- title = {Universal Sound Separation},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2019,
- pages = {170--174},
- month = oct,
- doi = {10.1109/WASPAA.2019.8937253},
- issn = {1947-1629},
- isbn = {978-1-7281-1123-0},
- url = {https://www.merl.com/publications/TR2019-123}
- }
- Manilow, E., Wichern, G., Seetharaman, P., Le Roux, J., "Cutting Music Source Separation Some Slakh: A Dataset to Study the Impact of Training Data Quality and Quantity", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2019.8937170, October 2019, pp. 45-49.
BibTeX TR2019-124 PDF Data- @inproceedings{Manilow2019oct,
- author = {Manilow, Ethan and Wichern, Gordon and Seetharaman, Prem and Le Roux, Jonathan},
- title = {Cutting Music Source Separation Some {Slakh}: A Dataset to Study the Impact of Training Data Quality and Quantity},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2019,
- pages = {45--49},
- month = oct,
- doi = {10.1109/WASPAA.2019.8937170},
- issn = {1947-1629},
- isbn = {978-1-7281-1123-0},
- url = {https://www.merl.com/publications/TR2019-124}
- }
- Karafiat, M., Baskar, M.K., Watanabe, S., Hori, T., Wiesner, M., Cernocky, J.H., "Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems", Interspeech, DOI: 10.21437/Interspeech.2019-2355, September 2019, pp. 2220-2224.
BibTeX TR2019-103 PDF- @inproceedings{Karafiat2019sep,
- author = {Karafiat, Martin and Baskar, Murali Karthick and Watanabe, Shinji and Hori, Takaaki and Wiesner, Matthew and Cernocky, Jan Honza},
- title = {Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems},
- booktitle = {Interspeech},
- year = 2019,
- pages = {2220--2224},
- month = sep,
- doi = {10.21437/Interspeech.2019-2355},
- url = {https://www.merl.com/publications/TR2019-103}
- }
- Wichern, G., McQuinn, E., Antognini, J., Flynn, M., Zhu, R., Crow, D., Manilow, E., Le Roux, J., "WHAM!: Extending Speech Separation to Noisy Environments", Interspeech, DOI: 10.21437/Interspeech.2019-2821, September 2019, pp. 1368-1372.
BibTeX TR2019-099 PDF- @inproceedings{Wichern2019sep,
- author = {Wichern, Gordon and McQuinn, Emmett and Antognini, Joe and Flynn, Michael and Zhu, Richard and Crow, Dwight and Manilow, Ethan and Le Roux, Jonathan},
- title = {{WHAM!}: Extending Speech Separation to Noisy Environments},
- booktitle = {Interspeech},
- year = 2019,
- pages = {1368--1372},
- month = sep,
- doi = {10.21437/Interspeech.2019-2821},
- url = {https://www.merl.com/publications/TR2019-099}
- }
- Wang, J., Cherian, A., "Discriminative Video Representation Learning Using Support Vector Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2019.2937292, August 2019.
BibTeX TR2019-107 PDF- @article{Wang2019aug,
- author = {Wang, Jue and Cherian, Anoop},
- title = {Discriminative Video Representation Learning Using Support Vector Classifiers},
- journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
- year = 2019,
- month = aug,
- doi = {10.1109/TPAMI.2019.2937292},
- url = {https://www.merl.com/publications/TR2019-107}
- }
- Aihara, R., Hanazawa, T., Okato, Y., Wichern, G., Le Roux, J., "Teacher-Student Deep Clustering For Low-Delay Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682695, May 2019.
BibTeX TR2019-003 PDF- @inproceedings{Aihara2019may,
- author = {Aihara, Ryo and Hanazawa, Toshiyuki and Okato, Yohei and Wichern, Gordon and Le Roux, Jonathan},
- title = {Teacher-Student Deep Clustering For Low-Delay Channel Speech Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8682695},
- url = {https://www.merl.com/publications/TR2019-003}
- }
- Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "The Phasebook: Building Complex Masks via Discrete Representations for Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682587, May 2019.
BibTeX TR2019-008 PDF- @inproceedings{LeRoux2019may2,
- author = {Le Roux, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
- title = {The Phasebook: Building Complex Masks via Discrete Representations for Source Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8682587},
- url = {https://www.merl.com/publications/TR2019-008}
- }
- Le Roux, J., Wisdom, S., Erdogan, H., Hershey, J., "SDR -- Half-Baked or Well Done?", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683855, May 2019.
BibTeX TR2019-013 PDF- @inproceedings{LeRoux2019may,
- author = {Le Roux, Jonathan and Wisdom, Scott and Erdogan, Hakan and Hershey, John},
- title = {{SDR} -- Half-Baked or Well Done?},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8683855},
- url = {https://www.merl.com/publications/TR2019-013}
- }
- Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683198, May 2019.
BibTeX TR2019-014 PDF- @inproceedings{Seetharaman2019may2,
- author = {Seetharaman, Prem and Wichern, Gordon and Le Roux, Jonathan and Pardo, Bryan},
- title = {Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8683198},
- url = {https://www.merl.com/publications/TR2019-014}
- }
- Seetharaman, P., Wichern, G., Venkataramani, S., Le Roux, J., "Class-Conditional Embeddings for Music Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683007, May 2019.
BibTeX TR2019-004 PDF- @inproceedings{Seetharaman2019may,
- author = {Seetharaman, Prem and Wichern, Gordon and Venkataramani, Shrikant and Le Roux, Jonathan},
- title = {Class-Conditional Embeddings for Music Source Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8683007},
- url = {https://www.merl.com/publications/TR2019-004}
- }
- Wang, X., Li, R., Mallidi, S.H., Hori, T., Watanabe, S., Hermansky, H., "Stream Attention-Based Multi-Array End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682650, May 2019.
BibTeX TR2019-005 PDF- @inproceedings{Wang2019may,
- author = {Wang, Xiaofei and Li, Ruizhi and Mallidi, Sri Harish and Hori, Takaaki and Watanabe, Shinji and Hermansky, Hynek},
- title = {Stream Attention-Based Multi-Array End-to-End Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8682650},
- url = {https://www.merl.com/publications/TR2019-005}
- }
- Bergman, D., Cardonha, C., Cire, A., Raghunathan, A.U., "On the Minimum Chordal Completion Polytope", Operations Research, DOI: 10.1287/opre.2018.1783, Vol. 67, No. 2, pp. 532-547, March 2019.
BibTeX TR2018-095 PDF- @article{Bergman2019mar,
- author = {Bergman, David and Cardonha, Carlos and Cire, Andre and Raghunathan, Arvind U.},
- title = {On the Minimum Chordal Completion Polytope},
- journal = {Operations Research},
- year = 2019,
- volume = 67,
- number = 2,
- pages = {532--547},
- month = mar,
- doi = {10.1287/opre.2018.1783},
- url = {https://www.merl.com/publications/TR2018-095}
- }
- Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "Phasebook and Friends: Leveraging discrete representations for source separation", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2019.2904183, Vol. 13, No. 2, pp. 370-382, March 2019.
BibTeX TR2018-199 PDF- @article{LeRoux2019mar,
- author = {Le Roux, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
- title = {Phasebook and Friends: Leveraging discrete representations for source separation},
- journal = {IEEE Journal of Selected Topics in Signal Processing},
- year = 2019,
- volume = 13,
- number = 2,
- pages = {370--382},
- month = mar,
- doi = {10.1109/JSTSP.2019.2904183},
- url = {https://www.merl.com/publications/TR2018-199}
- }
- Pajovic, M., Ozcan, G., Koike-Akino, T., Wang, P., Orlik, P.V., "Packet Separation in Phase Noise Impaired Random Access Channel", IEEE Global Communications Conference (GLOBECOM), DOI: 10.1109/GLOCOM.2018.8647403, December 2018.
BibTeX TR2018-167 PDF- @inproceedings{Pajovic2018dec,
- author = {Pajovic, Milutin and Ozcan, Gozde and Koike-Akino, Toshiaki and Wang, Pu and Orlik, Philip V.},
- title = {Packet Separation in Phase Noise Impaired Random Access Channel},
- booktitle = {IEEE Global Communications Conference (GLOBECOM)},
- year = 2018,
- month = dec,
- doi = {10.1109/GLOCOM.2018.8647403},
- url = {https://www.merl.com/publications/TR2018-167}
- }
- Yu, X., Chaturvedi, S., Feng, C., Taguchi, Y., Lee, T.-Y., Fernandes, C., Ramalingam, S., "VLASE: Vehicle Localization by Aggregating Semantic Edges", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS.2018.8594358, October 2018, pp. 3196-3203.
BibTeX TR2018-113 PDF- @inproceedings{Yu2018oct,
- author = {Yu, Xin and Chaturvedi, Sagar and Feng, Chen and Taguchi, Yuichi and Lee, Teng-Yok and Fernandes, Clinton and Ramalingam, Srikumar},
- title = {{VLASE}: Vehicle Localization by Aggregating Semantic Edges},
- booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
- year = 2018,
- pages = {3196--3203},
- month = oct,
- doi = {10.1109/IROS.2018.8594358},
- url = {https://www.merl.com/publications/TR2018-113}
- }
- Wichern, G., Le Roux, J., "Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/IWAENC.2018.8521243, September 2018.
BibTeX TR2018-146 PDF- @inproceedings{Wichern2018sep,
- author = {Wichern, Gordon and Le Roux, Jonathan},
- title = {Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation},
- booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
- year = 2018,
- month = sep,
- doi = {10.1109/IWAENC.2018.8521243},
- url = {https://www.merl.com/publications/TR2018-146}
- }
- Wang, J., Cherian, A., "Learning Discriminative Video Representations Using Adversarial Perturbations", European Conference on Computer Vision (ECCV), September 2018.
BibTeX TR2018-139 PDF Software- @inproceedings{Wang2018sep3,
- author = {Wang, Jue and Cherian, Anoop},
- title = {Learning Discriminative Video Representations Using Adversarial Perturbations},
- booktitle = {European Conference on Computer Vision (ECCV)},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-139}
- }
- Wang, J., Cherian, A., "Discriminative Subspace Pooling for Action Recognition", Workshop on Perceptual Organization in Computer Vision as part of the European Conference on Computer Vision (ECCV), September 2018.
BibTeX TR2018-141 PDF- @inproceedings{Wang2018sep2,
- author = {Wang, Jue and Cherian, Anoop},
- title = {Discriminative Subspace Pooling for Action Recognition},
- booktitle = {Workshop on Perceptual Organization in Computer Vision as part of the European Conference on Computer Vision (ECCV)},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-141}
- }
- Wang, Z.-Q., Le Roux, J., Wang, D., Hershey, J., "End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction", Interspeech, September 2018.
BibTeX TR2018-135 PDF- @inproceedings{Wang2018sep,
- author = {Wang, Zhong-Qiu and Le Roux, Jonathan and Wang, DeLiang and Hershey, John},
- title = {End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction},
- booktitle = {Interspeech},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-135}
- }
- Seki, H., Hori, T., Watanabe, S., Le Roux, J., Hershey, J., "A Purely End-to-end System for Multi-speaker Speech Recognition", Annual Meeting of the Association for Computational Linguistics (ACL), July 2018, pp. 2620-2630.
BibTeX TR2018-104 PDF Video- @inproceedings{Seki2018jul,
- author = {Seki, Hiroshi and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan and Hershey, John},
- title = {A Purely End-to-end System for Multi-speaker Speech Recognition},
- booktitle = {Annual Meeting of the Association for Computational Linguistics (ACL)},
- year = 2018,
- pages = {2620--2630},
- month = jul,
- publisher = {Association for Computational Linguistics},
- url = {https://www.merl.com/publications/TR2018-104}
- }
- Pan, Y., Farahmand, A.-M., White, M., Nabi, S., Grover, P., Nikovski, D.N., "Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control", International Conference on Machine Learning (ICML), July 2018.
BibTeX TR2018-101 PDF- @inproceedings{Pan2018jul,
- author = {Pan, Yangchen and Farahmand, Amir-massoud and White, Martha and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
- title = {Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2018,
- month = jul,
- url = {https://www.merl.com/publications/TR2018-101}
- }
- Erdogan, H., Hershey, J., Watanabe, S., Le Roux, J., "Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 7, Springer, July 2018.
BibTeX - @incollection{Erdogan2018jul,
- author = {Erdogan, Hakan and Hershey, John and Watanabe, Shinji and Le Roux, Jonathan},
- title = {Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio},
- booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
- year = 2018,
- editor = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
- chapter = 7,
- month = jul,
- publisher = {Springer},
- isbn = {978-3-319-64680-0}
- }
- Di Cairano, S., Goldsmith, A., Kalabić, U., Bortoff, S.A., "Cascaded Reference Governor-MPC for Motion Control of Two-Stage Manufacturing Machines", IEEE Transactions on Control Systems Technology, DOI: 10.1109/TCST.2018.2847627, July 2018.
BibTeX TR2018-083 PDF- @article{DiCairano2018jul,
- author = {Di Cairano, Stefano and Goldsmith, Abraham and Kalabi{\'c}, Uro{\v{s}} and Bortoff, Scott A.},
- title = {Cascaded Reference Governor-{MPC} for Motion Control of Two-Stage Manufacturing Machines},
- journal = {IEEE Transactions on Control Systems Technology},
- year = 2018,
- month = jul,
- doi = {10.1109/TCST.2018.2847627},
- url = {https://www.merl.com/publications/TR2018-083}
- }
- Berntorp, K., Di Cairano, S., "Approximate Noise-Adaptive Filtering Using Student-t Distributions", American Control Conference (ACC), DOI: 10.23919/ACC.2018.8430902, June 2018, pp. 2745-2750.
BibTeX TR2018-088 PDF- @inproceedings{Berntorp2018jun2,
- author = {Berntorp, Karl and Di Cairano, Stefano},
- title = {Approximate Noise-Adaptive Filtering Using {Student-t} Distributions},
- booktitle = {American Control Conference (ACC)},
- year = 2018,
- pages = {2745--2750},
- month = jun,
- doi = {10.23919/ACC.2018.8430902},
- url = {https://www.merl.com/publications/TR2018-088}
- }
- Pajovic, M., Orlik, P.V., "Reduced-Dimension Symbol Detection in Random Access Channel", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC.2018.8422126, May 2018.
BibTeX TR2018-060 PDF- @inproceedings{Pajovic2018may,
- author = {Pajovic, Milutin and Orlik, Philip V.},
- title = {Reduced-Dimension Symbol Detection in Random Access Channel},
- booktitle = {IEEE International Conference on Communications (ICC)},
- year = 2018,
- month = may,
- doi = {10.1109/ICC.2018.8422126},
- url = {https://www.merl.com/publications/TR2018-060}
- }