Publications

259 / 3,904 publications found.


  •  Falcon Perez, R., Wichern, G., Germain, F., Le Roux, J., "Location as supervision for weakly supervised multi-channel source separation of machine sounds", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/​WASPAA58266.2023.10248128, September 2023.
    BibTeX TR2023-119 PDF Presentation
    • @inproceedings{FalconPerez2023aug,
    • author = {Falcon Perez, Ricardo and Wichern, Gordon and Germain, Francois and {Le Roux}, Jonathan},
    • title = {{Location as supervision for weakly supervised multi-channel source separation of machine sounds}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2023,
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/WASPAA58266.2023.10248128},
    • issn = {1947-1629},
    • isbn = {979-8-3503-2372-6},
    • url = {https://www.merl.com/publications/TR2023-119}
    • }
  •  Petermann, D., Wichern, G., Subramanian, A.S., Wang, Z.-Q., Le Roux, J., "Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2023.3290428, Vol. 31, pp. 2592-2605, September 2023.
    BibTeX TR2023-113 PDF
    • @article{Petermann2023sep,
    • author = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Wang, Zhong-Qiu and {Le Roux}, Jonathan},
    • title = {{Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks}},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2023,
    • volume = 31,
    • pages = {2592--2605},
    • month = sep,
    • doi = {10.1109/TASLP.2023.3290428},
    • issn = {2329-9304},
    • url = {https://www.merl.com/publications/TR2023-113}
    • }
  •  Salatiello, A., Wang, Y., Wichern, G., Koike-Akino, T., Ohta, Y., Kaneko, Y., Laughman, C.R., Chakrabarty, A., "Synthesizing Building Operation Data with Generative Models: VAEs, GANs, or Something In Between?", ACM e-Energy Conference, DOI: 10.1145/​3599733.3600260, June 2023.
    BibTeX TR2023-072 PDF
    • @inproceedings{Salatiello2023jun,
    • author = {Salatiello, Alessandro and Wang, Ye and Wichern, Gordon and Koike-Akino, Toshiaki and Ohta, Yoshihiro and Kaneko, Yosuke and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {{Synthesizing Building Operation Data with Generative Models: VAEs, GANs, or Something In Between?}},
    • booktitle = {ACM e-Energy Conference},
    • year = 2023,
    • month = jun,
    • doi = {10.1145/3599733.3600260},
    • url = {https://www.merl.com/publications/TR2023-072}
    • }
  •  Chen, K., Wichern, G., Germain, F., Le Roux, J., "Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT", IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB), DOI: 10.1109/​ICASSPW59220.2023.10193575, May 2023.
    BibTeX TR2023-030 PDF
    • @inproceedings{Chen2023may,
    • author = {Chen, Ke and Wichern, Gordon and Germain, Francois and {Le Roux}, Jonathan},
    • title = {{Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT}},
    • booktitle = {IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB)},
    • year = 2023,
    • month = may,
    • doi = {10.1109/ICASSPW59220.2023.10193575},
    • isbn = {979-8-3503-0261-5},
    • url = {https://www.merl.com/publications/TR2023-030}
    • }
  •  Aralikatti, R., Boeddeker, C., Wichern, G., Subramanian, A.S., Le Roux, J., "Reverberation as Supervision for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095022, May 2023, pp. 1-5.
    BibTeX TR2023-016 PDF
    • @inproceedings{Aralikatti2023may,
    • author = {Aralikatti, Rohith and Boeddeker, Christoph and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
    • title = {{Reverberation as Supervision for Speech Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095022},
    • url = {https://www.merl.com/publications/TR2023-016}
    • }
  •  Bralios, D., Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Latent Iterative Refinement for Modular Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096897, May 2023, pp. 1-5.
    BibTeX TR2023-019 PDF
    • @inproceedings{Bralios2023may,
    • author = {Bralios, Dimitrios and Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and {Le Roux}, Jonathan},
    • title = {{Latent Iterative Refinement for Modular Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10096897},
    • url = {https://www.merl.com/publications/TR2023-019}
    • }
  •  Jeon, E.S., Lohit, S., Anirudh, R., Turaga, P., "Robust Time Series Recovery and Classification Using Test-time Noise Simulator Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096888, May 2023.
    BibTeX TR2023-021 PDF Presentation
    • @inproceedings{Jeon2023may,
    • author = {Jeon, Eun Som and Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
    • title = {{Robust Time Series Recovery and Classification Using Test-time Noise Simulator Networks}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10096888},
    • url = {https://www.merl.com/publications/TR2023-021}
    • }
  •  Petermann, D., Wichern, G., Subramanian, A.S., Le Roux, J., "Hyperbolic Audio Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10094943, May 2023, pp. 1-5.
    BibTeX TR2023-017 PDF Video Software
    • @inproceedings{Petermann2023may,
    • author = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
    • title = {{Hyperbolic Audio Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10094943},
    • url = {https://www.merl.com/publications/TR2023-017}
    • }
  •  Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Optimal Condition Training for Target Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095128, May 2023, pp. 1-5.
    BibTeX TR2023-018 PDF
    • @inproceedings{Tzinis2023may,
    • author = {Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and {Le Roux}, Jonathan},
    • title = {{Optimal Condition Training for Target Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095128},
    • url = {https://www.merl.com/publications/TR2023-018}
    • }
  •  Aich, A., Peng, K.-C., Roy-Chowdhury, A.K., "Cross-Domain Video Anomaly Detection without Target Domain Adaptation", IEEE Winter Conference on Applications of Computer Vision (WACV), Crandall, D. and Gong, B. and Lee, Y. J. and Souvenir, R. and Yu, S., Eds., DOI: 10.1109/​WACV56688.2023.00261, January 2023, pp. 2578-2590.
    BibTeX TR2023-001 PDF Video Presentation
    • @inproceedings{Aich2023jan,
    • author = {Aich, Abhishek and Peng, Kuan-Chuan and Roy-Chowdhury, Amit K.},
    • title = {{Cross-Domain Video Anomaly Detection without Target Domain Adaptation}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2023,
    • editor = {Crandall, D. and Gong, B. and Lee, Y. J. and Souvenir, R. and Yu, S.},
    • pages = {2578--2590},
    • month = jan,
    • publisher = {IEEE},
    • doi = {10.1109/WACV56688.2023.00261},
    • issn = {2642-9381},
    • isbn = {978-1-6654-9346-8},
    • url = {https://www.merl.com/publications/TR2023-001}
    • }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation", Advances in Neural Information Processing Systems (NeurIPS), November 2022.
    BibTeX TR2022-140 PDF Presentation
    • @inproceedings{Chatterjee2022nov,
    • author = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
    • title = {{Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2022,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2022-140}
    • }
  •  Ahmed, S.M., Lohit, S., Peng, K.-C., Jones, M.J., Roy-Chowdhury, A.K., "Cross-Modal Knowledge Transfer Without Task-Relevant Source Data", European Conference on Computer Vision (ECCV), Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G. M. and Hassner, T., Eds., DOI: 10.1007/​978-3-031-19830-4_7, October 2022, pp. 111-127.
    BibTeX TR2022-135 PDF Video Software Presentation
    • @inproceedings{Ahmed2022oct,
    • author = {Ahmed, Sk Miraj and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Roy-Chowdhury, Amit K.},
    • title = {{Cross-Modal Knowledge Transfer Without Task-Relevant Source Data}},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2022,
    • editor = {Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G. M. and Hassner, T.},
    • pages = {111--127},
    • month = oct,
    • publisher = {Springer},
    • doi = {10.1007/978-3-031-19830-4_7},
    • isbn = {978-3-031-19830-4},
    • url = {https://www.merl.com/publications/TR2022-135}
    • }
  •  Xia, H., Wang, P., Ding, Z., "Incomplete Multi-view Domain Adaptation via Channel Enhancement and Knowledge Transfer", European Conference on Computer Vision (ECCV), DOI: 10.1007/​978-3-031-19830-4_12, October 2022.
    BibTeX TR2022-134 PDF
    • @inproceedings{Xia2022oct,
    • author = {Xia, Haifeng and Wang, Pu and Ding, Zhengming},
    • title = {{Incomplete Multi-view Domain Adaptation via Channel Enhancement and Knowledge Transfer}},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2022,
    • month = oct,
    • doi = {10.1007/978-3-031-19830-4_12},
    • isbn = {978-3-031-19830-4},
    • url = {https://www.merl.com/publications/TR2022-134}
    • }
  •  Tzinis, E., Wichern, G., Subramanian, A.S., Smaragdis, P., Le Roux, J., "Heterogeneous Target Speech Separation", Interspeech, DOI: 10.21437/​Interspeech.2022-10717, September 2022, pp. 1796-1800.
    BibTeX TR2022-115 PDF Video Presentation
    • @inproceedings{Tzinis2022sep,
    • author = {Tzinis, Efthymios and Wichern, Gordon and Subramanian, Aswin Shanmugam and Smaragdis, Paris and {Le Roux}, Jonathan},
    • title = {{Heterogeneous Target Speech Separation}},
    • booktitle = {Interspeech},
    • year = 2022,
    • pages = {1796--1800},
    • month = sep,
    • doi = {10.21437/Interspeech.2022-10717},
    • url = {https://www.merl.com/publications/TR2022-115}
    • }
  •  Zhan, S., Wichern, G., Laughman, C.R., Chong, A., Chakrabarty, A., "Calibrating building simulation models using multi-source datasets and meta-learned Bayesian optimization", Energy and Buildings, DOI: 10.1016/​j.enbuild.2022.112278, Vol. 270, pp. 112278, September 2022.
    BibTeX TR2022-072 PDF
    • @article{Zhan2023jan,
    • author = {Zhan, Sicheng and Wichern, Gordon and Laughman, Christopher R. and Chong, Adrian and Chakrabarty, Ankush},
    • title = {{Calibrating building simulation models using multi-source datasets and meta-learned Bayesian optimization}},
    • journal = {Energy and Buildings},
    • year = 2022,
    • volume = 270,
    • pages = 112278,
    • month = sep,
    • doi = {10.1016/j.enbuild.2022.112278},
    • url = {https://www.merl.com/publications/TR2022-072}
    • }
  •  Xia, H., Wang, P., Koike-Akino, T., Wang, Y., Orlik, P.V., Ding, Z., "Adversarial Bi-Regressor Network for Domain Adaptive Regression", International Joint Conference on Artificial Intelligence (IJCAI), De Raedt, Luc, Ed., DOI: 10.24963/​ijcai.2022/​501, July 2022, pp. 3608-3614.
    BibTeX TR2022-103 PDF
    • @inproceedings{Xia2022jul,
    • author = {Xia, Haifeng and Wang, Pu and Koike-Akino, Toshiaki and Wang, Ye and Orlik, Philip V. and Ding, Zhengming},
    • title = {{Adversarial Bi-Regressor Network for Domain Adaptive Regression}},
    • booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
    • year = 2022,
    • editor = {De Raedt, Luc},
    • pages = {3608--3614},
    • month = jul,
    • publisher = {IJCAI},
    • doi = {10.24963/ijcai.2022/501},
    • url = {https://www.merl.com/publications/TR2022-103}
    • }
  •  Raghunathan, A., Jha, D.K., Romeres, D., "Python-based Open Source Package for Optimization of Contact-rich Systems", Robotics: Science and Systems, June 2022.
    BibTeX TR2022-089 PDF
    • @inproceedings{Raghunathan2022jun,
    • author = {Raghunathan, Arvind and Jha, Devesh K. and Romeres, Diego},
    • title = {{Python-based Open Source Package for Optimization of Contact-rich Systems}},
    • booktitle = {Robotics: Science and Systems},
    • year = 2022,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2022-089}
    • }
  •  Petermann, D., Wichern, G., Wang, Z.-Q., Le Roux, J., "The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9746005, April 2022, pp. 526-530.
    BibTeX TR2022-022 PDF Video Software
    • @inproceedings{Petermann2022apr,
    • author = {Petermann, Darius and Wichern, Gordon and Wang, Zhong-Qiu and {Le Roux}, Jonathan},
    • title = {{The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {526--530},
    • month = apr,
    • doi = {10.1109/ICASSP43922.2022.9746005},
    • url = {https://www.merl.com/publications/TR2022-022}
    • }
  •  Slizovskaia, O., Wichern, G., Wang, Z.-Q., Le Roux, J., "Locate This, Not That: Class-Conditioned Sound Event DOA Estimation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9747604, April 2022, pp. 711-715.
    BibTeX TR2022-023 PDF
    • @inproceedings{Slizovskaia2022mar,
    • author = {Slizovskaia, Olga and Wichern, Gordon and Wang, Zhong-Qiu and {Le Roux}, Jonathan},
    • title = {{Locate This, Not That: Class-Conditioned Sound Event DOA Estimation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {711--715},
    • month = apr,
    • doi = {10.1109/ICASSP43922.2022.9747604},
    • url = {https://www.merl.com/publications/TR2022-023}
    • }
  •  Wang, B., Shin, K.-H., Hidaka, Y., Kondo, S., Arita, H., Ito, K., "Analytical Magnetic Model for Variable-Flux Interior Permanent Magnet Synchronous Motors", IEEE Energy Conversion Congress and Exposition (ECCE), DOI: 10.1109/​ECCE47101.2021.9595341, October 2021, pp. 4142-4148.
    BibTeX TR2021-123 PDF
    • @inproceedings{Wang2021oct2,
    • author = {Wang, Bingnan and Shin, Kyung-Hun and Hidaka, Yuki and Kondo, Shota and Arita, Hideaki and Ito, Kazumasa},
    • title = {{Analytical Magnetic Model for Variable-Flux Interior Permanent Magnet Synchronous Motors}},
    • booktitle = {IEEE Energy Conversion Congress and Exposition (ECCE)},
    • year = 2021,
    • pages = {4142--4148},
    • month = oct,
    • publisher = {IEEE},
    • doi = {10.1109/ECCE47101.2021.9595341},
    • url = {https://www.merl.com/publications/TR2021-123}
    • }
  •  Chatterjee, M., Le Roux, J., Ahuja, N., Cherian, A., "Visual Scene Graphs for Audio Source Separation", IEEE International Conference on Computer Vision (ICCV), October 2021, pp. 1204-1213.
    BibTeX TR2021-095 PDF Video Software
    • @inproceedings{Chatterjee2021oct,
    • author = {Chatterjee, Moitreya and {Le Roux}, Jonathan and Ahuja, Narendra and Cherian, Anoop},
    • title = {{Visual Scene Graphs for Audio Source Separation}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2021,
    • pages = {1204--1213},
    • month = oct,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2021-095}
    • }
  •  Liu, B., Guo, J., Koike-Akino, T., Wang, Y., Kim, K.J., Parsons, K., Orlik, P.V., Hashimoto, S., Yuan, J., "Anomaly Detection and Diagnosis Using Pre-Processing and Time-Delay Autoencoder", IEEE International Conference on Emerging Technologies and Factory Automation, September 2021.
    BibTeX TR2021-107 PDF
    • @inproceedings{Liu2021sep,
    • author = {Liu, Bryan and Guo, Jianlin and Koike-Akino, Toshiaki and Wang, Ye and Kim, Kyeong Jin and Parsons, Kieran and Orlik, Philip V. and Hashimoto, Shigeru and Yuan, Jinhong},
    • title = {{Anomaly Detection and Diagnosis Using Pre-Processing and Time-Delay Autoencoder}},
    • booktitle = {IEEE International Conference on Emerging Technologies and Factory Automation},
    • year = 2021,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2021-107}
    • }
  •  Li, K., Yagyu, E., Sato, H., Teo, K.H., Rakheja, S., "Compact modeling of gate leakage phenomenon in GaN HEMTs", IEEE Transactions on Electron Devices, DOI: 10.23919/​SISPAD49475.2020.9241666, June 2021.
    BibTeX TR2021-079 PDF
    • @article{Li2021jun,
    • author = {Li, Kexin and Yagyu, Eiji and Sato, Hisashi and Teo, Koon Hoo and Rakheja, Shaloo},
    • title = {{Compact modeling of gate leakage phenomenon in GaN HEMTs}},
    • journal = {IEEE Transactions on Electron Devices},
    • year = 2021,
    • month = jun,
    • doi = {10.23919/SISPAD49475.2020.9241666},
    • url = {https://www.merl.com/publications/TR2021-079}
    • }
  •  Hung, Y.-N., Wichern, G., Le Roux, J., "Transcription Is All You Need: Learning to Separate Musical Mixtures with Score as Supervision", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP39728.2021.9413358, June 2021, pp. 46-50.
    BibTeX TR2021-069 PDF
    • @inproceedings{Hung2021jun,
    • author = {Hung, Yun-Ning and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Transcription Is All You Need: Learning to Separate Musical Mixtures with Score as Supervision}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2021,
    • pages = {46--50},
    • month = jun,
    • doi = {10.1109/ICASSP39728.2021.9413358},
    • issn = {2379-190X},
    • isbn = {978-1-7281-7605-5},
    • url = {https://www.merl.com/publications/TR2021-069}
    • }
  •  Khurana, S., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP39728.2021.9414299, June 2021, pp. 6553-6557.
    BibTeX TR2021-039 PDF
    • @inproceedings{Khurana2021jun,
    • author = {Khurana, Sameer and Moritz, Niko and Hori, Takaaki and {Le Roux}, Jonathan},
    • title = {{Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2021,
    • pages = {6553--6557},
    • month = jun,
    • doi = {10.1109/ICASSP39728.2021.9414299},
    • url = {https://www.merl.com/publications/TR2021-039}
    • }