- Uhlich, S., Fabbro, G., Hirano, M., Takahashi, S., Wichern, G., Le Roux, J., Chakraborty, D., Mohanty, S., Li, K., Luo, Y., Yu, J., Gu, R., Solovyev, R., Stempkovskiy, A., Habruseva, T., Sukhovei, M., Mitsufuji, Y., "The Sound Demixing Challenge 2023 – Cinematic Demixing Track", Transactions of the International Society for Music Information Retrieval, DOI: 10.5334/tismir.172, Vol. 7, No. 1, pp. 44-62, May 2024.
BibTeX TR2024-047 PDF- @article{Uhlich2024may,
- author = {Uhlich, Stefan and Fabbro, Giorgio and Hirano, Masato and Takahashi, Shusuke and Wichern, Gordon and {Le Roux}, Jonathan and Chakraborty, Dipam and Mohanty, Sharada and Li, Kai and Luo, Yi and Yu, Jianwei and Gu, Rongzhi and Solovyev, Roman and Stempkovskiy, Alexander and Habruseva, Tatiana and Sukhovei, Mikhail and Mitsufuji, Yuki},
- title = {{The Sound Demixing Challenge 2023 -- Cinematic Demixing Track}},
- journal = {Transactions of the International Society for Music Information Retrieval},
- year = 2024,
- volume = 7,
- number = 1,
- pages = {44--62},
- month = may,
- doi = {10.5334/tismir.172},
- url = {https://www.merl.com/publications/TR2024-047}
- }
- Xu, W., Jones, C., Svetozarevic, B., Laughman, C.R., Chakrabarty, A., "Violation-Aware Contextual Bayesian Optimization for Controller Performance Optimization with Unmodeled Constraints", Journal of Process Control, DOI: 10.1016/j.jprocont.2024.103212, Vol. 138, April 2024.
BibTeX TR2024-046 PDF- @article{Xu2024apr,
- author  = {Xu, Wenjie and Jones, Colin and Svetozarevic, Bratislav and Laughman, Christopher R. and Chakrabarty, Ankush},
- title   = {{Violation-Aware Contextual Bayesian Optimization for Controller Performance Optimization with Unmodeled Constraints}},
- journal = {Journal of Process Control},
- volume  = {138},
- month   = apr,
- year    = {2024},
- doi     = {10.1016/j.jprocont.2024.103212},
- url     = {https://www.merl.com/publications/TR2024-046},
- }
- Vaca-Rubio, C., Wang, P., Koike-Akino, T., Wang, Y., Boufounos, P.T., Popovski, P., "Object Trajectory Estimation with Continuous-Time Neural Dynamic Learning of Millimeter-Wave Wi-Fi", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2024.3388930, April 2024.
BibTeX TR2024-044 PDF- @article{Vaca-Rubio2024apr,
- author  = {Vaca-Rubio, Cristian and Wang, Pu and Koike-Akino, Toshiaki and Wang, Ye and Boufounos, Petros T. and Popovski, Petar},
- title   = {{Object Trajectory Estimation with Continuous-Time Neural Dynamic Learning of Millimeter-Wave Wi-Fi}},
- journal = {IEEE Journal of Selected Topics in Signal Processing},
- month   = apr,
- year    = {2024},
- doi     = {10.1109/JSTSP.2024.3388930},
- issn    = {1941-0484},
- url     = {https://www.merl.com/publications/TR2024-044},
- }
- Dey, R., Egger, B., Boddeti, V., Wang, Y., Marks, T.K., "CoLa-SDF: Controllable Latent StyleSDF for Disentangled 3D Face Generation", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), April 2024.
BibTeX TR2024-045 PDF- @inproceedings{Dey2024apr,
- author    = {Dey, Rahul and Egger, Bernhard and Boddeti, Vishnu and Wang, Ye and Marks, Tim K.},
- title     = {{CoLa-SDF: Controllable Latent StyleSDF for Disentangled 3D Face Generation}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
- month     = apr,
- year      = {2024},
- url       = {https://www.merl.com/publications/TR2024-045},
- }
- Nagai, Y., Guo, J., Sumi, T., Parsons, K., Orlik, P.V., Rolfe, B.A., Wang, P., "Improve IEEE 802.15.4 Network Reliability by Suspendable CSMA/CA", IEEE Wireless Communications and Networking Conference (WCNC), April 2024.
BibTeX TR2024-039 PDF- @inproceedings{Nagai2024apr,
- author    = {Nagai, Yukimasa and Guo, Jianlin and Sumi, Takenori and Parsons, Kieran and Orlik, Philip V. and Rolfe, Benjamin A. and Wang, Pu},
- title     = {{Improve IEEE 802.15.4 Network Reliability by Suspendable CSMA/CA}},
- booktitle = {IEEE Wireless Communications and Networking Conference (WCNC)},
- month     = apr,
- year      = {2024},
- url       = {https://www.merl.com/publications/TR2024-039},
- }
- Dong, Y., Qiao, H., Laughman, C.R., "Physically-constrained Hybrid Modeling for Vapor Compression Systems", Thermal and Fluids Engineering Conference, DOI: 10.1615/TFEC2024.ml.050269, April 2024, pp. 1259-1268.
BibTeX TR2024-038 PDF- @inproceedings{Dong2024apr,
- author    = {Dong, Yiyun and Qiao, Hongtao and Laughman, Christopher R.},
- title     = {{Physically-constrained Hybrid Modeling for Vapor Compression Systems}},
- booktitle = {9th Thermal and Fluids Engineering Conference},
- pages     = {1259--1268},
- month     = apr,
- year      = {2024},
- doi       = {10.1615/TFEC2024.ml.050269},
- issn      = {2379-1748},
- url       = {https://www.merl.com/publications/TR2024-038},
- }
- Yan, J., Chakrabarty, A., Rupenyan, A., Lygeros, J., "MPC of Uncertain Nonlinear Systems with Meta-Learning for Fast Adaptation of Neural Predictive Models", arXiv, April 2024.
BibTeX arXiv- @article{Yan2024apr,
- author = {Yan, Jiaqi and Chakrabarty, Ankush and Rupenyan, Alisa and Lygeros, John},
- title = {{MPC of Uncertain Nonlinear Systems with Meta-Learning for Fast Adaptation of Neural Predictive Models}},
- journal = {arXiv},
- year = 2024,
- month = apr,
- eprint = {2404.12097},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2404.12097}
- }
- Hegde, D., Lohit, S., Peng, K.-C., Jones, M.J., Patel, V.M., "Multimodal 3D Object Detection on Unseen Domains", arXiv, April 2024.
BibTeX arXiv- @article{Hegde2024apr,
- author = {Hegde, Deepti and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Patel, Vishal M.},
- title = {{Multimodal 3D Object Detection on Unseen Domains}},
- journal = {arXiv},
- year = 2024,
- month = apr,
- eprint = {2404.11764},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2404.11764}
- }
- Pan, Z., Wichern, G., Germain, F.G., Subramanian, A., Le Roux, J., "Late Audio-Visual Fusion for In-The-Wild Speaker Diarization", Hands-free Speech Communication and Microphone Arrays (HSCMA), DOI: 10.1109/ICASSPW62465.2024.10626914, April 2024, pp. 174-178.
BibTeX TR2024-029 PDF- @inproceedings{Pan2024apr,
- author = {Pan, Zexu and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Subramanian, Aswin and {Le Roux}, Jonathan},
- title = {{Late Audio-Visual Fusion for In-The-Wild Speaker Diarization}},
- booktitle = {Hands-free Speech Communication and Microphone Arrays (HSCMA)},
- year = 2024,
- pages = {174--178},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSPW62465.2024.10626914},
- isbn = {979-8-3503-7451-3},
- url = {https://www.merl.com/publications/TR2024-029}
- }
- Fujihashi, T., Kato, S., Koike-Akino, T., "Implicit Neural Representation for Low-Overhead Graph-Based Holographic-Type Communications", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10445857, April 2024.
BibTeX TR2024-022 PDF- @inproceedings{Fujihashi2024apr,
- author    = {Fujihashi, Takuya and Kato, Sorachi and Koike-Akino, Toshiaki},
- title     = {{Implicit Neural Representation for Low-Overhead Graph-Based Holographic-Type Communications}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- publisher = {IEEE},
- month     = apr,
- year      = {2024},
- doi       = {10.1109/ICASSP48485.2024.10445857},
- issn      = {2379-190X},
- isbn      = {979-8-3503-4485-1},
- url       = {https://www.merl.com/publications/TR2024-022},
- }
- Queeney, J., Ozcan, E.C., Paschalidis, I.C., Cassandras, C.G., "Optimal Transport Perturbations for Safe Reinforcement Learning with Robustness Guarantees", Transactions on Machine Learning Research (TMLR), April 2024.
BibTeX TR2024-037 PDF- @article{Queeney2024apr,
- author  = {Queeney, James and Ozcan, Erhan Can and Paschalidis, Ioannis Ch. and Cassandras, Christos G.},
- title   = {{Optimal Transport Perturbations for Safe Reinforcement Learning with Robustness Guarantees}},
- journal = {Transactions on Machine Learning Research (TMLR)},
- month   = apr,
- year    = {2024},
- issn    = {2835-8856},
- url     = {https://www.merl.com/publications/TR2024-037},
- }
- Yang, Z., Liu, J., Chen, P., Cherian, A., Marks, T.K., Le Roux, J., Gan, C., "RILA: Reflective and Imaginative Language Agent for Zero-Shot Semantic Audio-Visual Navigation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), April 2024, pp. 16251-16261.
BibTeX TR2024-043 PDF- @inproceedings{Yang2024apr,
- author    = {Yang, Zeyuan and Liu, Jiageng and Chen, Peihao and Cherian, Anoop and Marks, Tim K. and {Le Roux}, Jonathan and Gan, Chuang},
- title     = {{RILA: Reflective and Imaginative Language Agent for Zero-Shot Semantic Audio-Visual Navigation}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- publisher = {CVF},
- pages     = {16251--16261},
- month     = apr,
- year      = {2024},
- url       = {https://www.merl.com/publications/TR2024-043},
- }
- Jeon, W., Chakrabarty, A., Zemouche, A., Rajamani, R., "LMI-Based Neural Observer for State and Nonlinear Function Estimation", International Journal of Robust and Nonlinear Control, DOI: 10.1002/rnc.7327, April 2024.
BibTeX TR2024-036 PDF- @article{Jeon2024apr,
- author  = {Jeon, Woongsun and Chakrabarty, Ankush and Zemouche, Ali and Rajamani, Rajesh},
- title   = {{LMI-Based Neural Observer for State and Nonlinear Function Estimation}},
- journal = {International Journal of Robust and Nonlinear Control},
- month   = apr,
- year    = {2024},
- doi     = {10.1002/rnc.7327},
- url     = {https://www.merl.com/publications/TR2024-036},
- }
- Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers", arXiv, April 2024.
BibTeX arXiv- @article{Koo2024apr2,
- author = {Koo, Junghyun and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and {Le Roux}, Jonathan},
- title = {{SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers}},
- journal = {arXiv},
- year = 2024,
- month = apr,
- eprint = {2404.02252},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2404.02252}
- }
- Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), April 2024.
BibTeX TR2024-032 PDF- @inproceedings{Koo2024apr,
- author = {Koo, Junghyun and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and {Le Roux}, Jonathan},
- title = {{Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads}},
- booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
- year = 2024,
- month = apr,
- url = {https://www.merl.com/publications/TR2024-032}
- }
- Zhang, Z., Lin, C., Wang, B., "Physics-informed shape optimization using coordinate projection", Scientific Reports, DOI: 10.1038/s41598-024-57137-4, Vol. 14, pp. 6537, April 2024.
BibTeX TR2024-035 PDF- @article{Zhang2024apr,
- author  = {Zhang, Zhizhou and Lin, Chungwei and Wang, Bingnan},
- title   = {{Physics-informed shape optimization using coordinate projection}},
- journal = {Scientific Reports},
- volume  = {14},
- pages   = {6537},
- month   = apr,
- year    = {2024},
- doi     = {10.1038/s41598-024-57137-4},
- url     = {https://www.merl.com/publications/TR2024-035},
- }
- Zhu, X., Jha, D.K., Romeres, D., Sun, L., Tomizuka, M., Cherian, A., "Multi-level Reasoning for Robotic Assembly: From Sequence Inference to Contact Selection", IEEE International Conference on Robotics and Automation (ICRA), March 2024, pp. 816-823.
BibTeX TR2024-033 PDF Video- @inproceedings{Zhu2024mar,
- author    = {Zhu, Xinghao and Jha, Devesh K. and Romeres, Diego and Sun, Lingfeng and Tomizuka, Masayoshi and Cherian, Anoop},
- title     = {{Multi-level Reasoning for Robotic Assembly: From Sequence Inference to Contact Selection}},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
- publisher = {IEEE},
- pages     = {816--823},
- month     = mar,
- year      = {2024},
- url       = {https://www.merl.com/publications/TR2024-033},
- }
- Wang, Y., Hansen, E., Ahn, H., "Hierarchical planning for autonomous parking in dynamic environments", IEEE Transactions on Control Systems Technology, DOI: 10.1109/TCST.2024.3367468, March 2024.
BibTeX TR2024-034 PDF- @article{Wang2024mar2,
- author  = {Wang, Yebin and Hansen, Emma and Ahn, Heejin},
- title   = {{Hierarchical planning for autonomous parking in dynamic environments}},
- journal = {IEEE Transactions on Control Systems Technology},
- month   = mar,
- year    = {2024},
- doi     = {10.1109/TCST.2024.3367468},
- issn    = {1558-0865},
- url     = {https://www.merl.com/publications/TR2024-034},
- }
- Gaur, A., Pais, G., Miraldo, P., "Oriented-grid Encoder for 3D Implicit Representations", International Conference on 3D Vision (3DV), DOI: 10.1109/3DV62453.2024.00101, March 2024, pp. 1208-1218.
BibTeX TR2024-031 PDF- @inproceedings{Gaur2024mar,
- author    = {Gaur, Arihant and Pais, Goncalo and Miraldo, Pedro},
- title     = {{Oriented-grid Encoder for 3D Implicit Representations}},
- booktitle = {International Conference on 3D Vision (3DV)},
- publisher = {IEEE},
- pages     = {1208--1218},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/3DV62453.2024.00101},
- issn      = {2475-7888},
- isbn      = {979-8-3503-6245-9},
- url       = {https://www.merl.com/publications/TR2024-031},
- }
- Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., Wang, G., Koike-Akino, T., "SuperLoRA: Parameter-Efficient Unified Adaptation of Multi-Layer Attention Modules", arXiv, March 2024.
BibTeX arXiv- @article{Chen2024mar,
- author = {Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew and Wang, Guanghui and Koike-Akino, Toshiaki},
- title = {{SuperLoRA: Parameter-Efficient Unified Adaptation of Multi-Layer Attention Modules}},
- journal = {arXiv},
- year = 2024,
- month = mar,
- eprint = {2403.11887},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2403.11887}
- }
- Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Why does music source separation benefit from cacophony?", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), DOI: 10.1109/ICASSPW62465.2024.10669899, March 2024, pp. 873-877.
BibTeX TR2024-030 PDF Video- @inproceedings{Jeon2024mar,
- author = {Jeon, Chang-Bin and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
- title = {{Why does music source separation benefit from cacophony?}},
- booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
- year = 2024,
- pages = {873--877},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSPW62465.2024.10669899},
- isbn = {979-8-3503-7451-3},
- url = {https://www.merl.com/publications/TR2024-030}
- }
- Bralios, D., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "Generation or Replication: Auscultating Audio Latent Diffusion Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447705, March 2024, pp. 1156-1160.
BibTeX TR2024-027 PDF- @inproceedings{Bralios2024mar,
- author = {Bralios, Dimitrios and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and {Le Roux}, Jonathan},
- title = {{Generation or Replication: Auscultating Audio Latent Diffusion Models}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {1156--1160},
- month = mar,
- doi = {10.1109/ICASSP48485.2024.10447705},
- url = {https://www.merl.com/publications/TR2024-027}
- }
- Fernandez-Menduina, S., Rapp, J., Mansour, H., Greiff, M., Parsons, K., "Tracking Beyond the Unambiguous Range with Modulo Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446835, March 2024, pp. 6-10.
BibTeX TR2024-021 PDF- @inproceedings{Fernandez-Menduina2024mar,
- author    = {Fernandez-Menduina, Samuel and Rapp, Joshua and Mansour, Hassan and Greiff, Marcus and Parsons, Kieran},
- title     = {{Tracking Beyond the Unambiguous Range with Modulo Single-Photon Lidar}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages     = {6--10},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/ICASSP48485.2024.10446835},
- url       = {https://www.merl.com/publications/TR2024-021},
- }
- Masuyama, Y., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "NIIRF: Neural IIR Filter Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10448477, March 2024, pp. 1016-1020.
BibTeX TR2024-026 PDF Software- @inproceedings{Masuyama2024mar,
- author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and {Le Roux}, Jonathan},
- title = {{NIIRF: Neural IIR Filter Field for HRTF Upsampling and Personalization}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {1016--1020},
- month = mar,
- doi = {10.1109/ICASSP48485.2024.10448477},
- url = {https://www.merl.com/publications/TR2024-026}
- }
- Pan, Z., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "NeuroHeed+: Improving Neuro-steered Speaker Extraction with Joint Auditory Attention Detection", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446333, March 2024, pp. 11456-11460.
BibTeX TR2024-025 PDF- @inproceedings{Pan2024mar,
- author = {Pan, Zexu and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and {Le Roux}, Jonathan},
- title = {{NeuroHeed+: Improving Neuro-steered Speaker Extraction with Joint Auditory Attention Detection}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {11456--11460},
- month = mar,
- doi = {10.1109/ICASSP48485.2024.10446333},
- url = {https://www.merl.com/publications/TR2024-025}
- }