Publications

Ji, D.-Y., Wang, B., Inoue, H., Kanemaru, M., "Motor Fault Detection with a Hybrid Physics-based and Data-Driven Method", IEEE International Electric Machines and Drives Conference (IEMDC), DOI: 10.1109/IEMDC60492.2025.11061000, May 2025, pp. 1178-1183.
BibTeX TR2025-062 PDF
- @inproceedings{Ji2025may,
- author    = {Ji, Dai-Yan and Wang, Bingnan and Inoue, Hiroshi and Kanemaru, Makoto},
- title     = {{Motor Fault Detection with a Hybrid Physics-based and Data-Driven Method}},
- booktitle = {2025 IEEE International Electric Machines \& Drives Conference (IEMDC)},
- pages     = {1178--1183},
- month     = may,
- year      = {2025},
- doi       = {10.1109/IEMDC60492.2025.11061000},
- url       = {https://www.merl.com/publications/TR2025-062}
- }
Sun, S., Wang, Y., Koike-Akino, T., Yamamoto, T., Sakamoto, Y., Wang, B., "Electric Motor Cogging Torque Prediction with Vision Transformer Models", IEEE International Electric Machines and Drives Conference (IEMDC), DOI: 10.1109/IEMDC60492.2025.11061129, May 2025, pp. 782-788.
BibTeX TR2025-059 PDF
- @inproceedings{Sun2025may,
- author    = {Sun, Siyuan and Wang, Ye and Koike-Akino, Toshiaki and Yamamoto, Tatsuya and Sakamoto, Yusuke and Wang, Bingnan},
- title     = {{Electric Motor Cogging Torque Prediction with Vision Transformer Models}},
- booktitle = {2025 IEEE International Electric Machines \& Drives Conference (IEMDC)},
- pages     = {782--788},
- month     = may,
- year      = {2025},
- doi       = {10.1109/IEMDC60492.2025.11061129},
- url       = {https://www.merl.com/publications/TR2025-059}
- }
Wu, J., Goldsmith, A., Liu, D., Wang, B., Zhou, L., Wang, Y., "A Unified Observer for Smooth Speed-Sensorless Drive Control of Induction Machines at Full Speed Range", IEEE International Electric Machines and Drives Conference (IEMDC), DOI: 10.1109/IEMDC60492.2025.11060981, May 2025.
BibTeX TR2025-060 PDF
- @inproceedings{Wu2025may,
- author    = {Wu, Jingjie and Goldsmith, Abraham and Liu, Dehong and Wang, Bingnan and Zhou, Lei and Wang, Yebin},
- title     = {{A Unified Observer for Smooth Speed-Sensorless Drive Control of Induction Machines at Full Speed Range}},
- booktitle = {IEEE International Electric Machines and Drives Conference (IEMDC)},
- month     = may,
- year      = {2025},
- doi       = {10.1109/IEMDC60492.2025.11060981},
- url       = {https://www.merl.com/publications/TR2025-060}
- }
Wu, J., Goldsmith, A., Zhou, L., Liu, D., Wang, B., Wang, Y., "A Novel High-Frequency Injection Method Towards Speed-Sensorless Drive Control of Induction Machines over Full Speed Range", IEEE International Electric Machines and Drives Conference (IEMDC), DOI: 10.1109/IEMDC60492.2025.11061131, May 2025.
BibTeX TR2025-061 PDF
- @inproceedings{Wu2025may2,
- author    = {Wu, Jingjie and Goldsmith, Abraham and Zhou, Lei and Liu, Dehong and Wang, Bingnan and Wang, Yebin},
- title     = {{A Novel High-Frequency Injection Method Towards Speed-Sensorless Drive Control of Induction Machines over Full Speed Range}},
- booktitle = {IEEE International Electric Machines and Drives Conference (IEMDC)},
- month     = may,
- year      = {2025},
- doi       = {10.1109/IEMDC60492.2025.11061131},
- url       = {https://www.merl.com/publications/TR2025-061}
- }
Singh, A., Jones, M.J., Peng, K.-C., Chatterjee, M., Cherian, A., Learned-Miller, E., "Improving Open-World Object Localization by Discovering Background", CVPR Workshop on Domain Generalization: Evolution, Breakthroughs and Future Horizon, May 2025, pp. 6449-6458.
BibTeX TR2025-058 PDF
- @inproceedings{Singh2025may,
- author    = {Singh, Ashish and Jones, Michael J. and Peng, Kuan-Chuan and Chatterjee, Moitreya and Cherian, Anoop and Learned-Miller, Erik},
- title     = {{Improving Open-World Object Localization by Discovering Background}},
- booktitle = {CVPR Workshop on Domain Generalization: Evolution, Breakthroughs and Future Horizon},
- pages     = {6449--6458},
- month     = may,
- year      = {2025},
- url       = {https://www.merl.com/publications/TR2025-058}
- }
Basu, S., Lohit, S., Brand, M., "G-RepsNet: A Lightweight Construction of Equivariant Networks for Arbitrary Matrix Groups", Transactions on Machine Learning Research (TMLR), May 2025.
BibTeX TR2025-056 PDF Software
- @article{Basu2025may,
- author  = {Basu, Sourya and Lohit, Suhas and Brand, Matthew},
- title   = {{G-RepsNet: A Lightweight Construction of Equivariant Networks for Arbitrary Matrix Groups}},
- journal = {Transactions on Machine Learning Research (TMLR)},
- month   = may,
- year    = {2025},
- issn    = {2835-8856},
- url     = {https://www.merl.com/publications/TR2025-056}
- }
Bronars, A., Corcodel, R., Jha, D.K., "High-Accuracy Tactile Pose Estimation for Connector Assembly", ICRA 2025 Workshop on “Towards Human Level Intelligence Vision and Tactile Sensing”, May 2025.
BibTeX TR2025-057 PDF
- @inproceedings{Bronars2025may,
- author    = {Bronars, Antonia and Corcodel, Radu and Jha, Devesh K.},
- title     = {{High-Accuracy Tactile Pose Estimation for Connector Assembly}},
- booktitle = {ICRA 2025 Workshop on ``Towards Human Level Intelligence Vision and Tactile Sensing''},
- month     = may,
- year      = {2025},
- url       = {https://www.merl.com/publications/TR2025-057}
- }
Pan, C., Brand, M., "Inverse Design of Multilayer Broadband “RGBP” Freeform Metalens for Dual-Functional Color-sorting and Polarization Imaging", Conference on Lasers and Electro-Optics (CLEO), May 2025.
BibTeX TR2025-055 PDF
- @inproceedings{Pan2025may,
- author    = {Pan, Cindy ``Hsin'' and Brand, Matthew},
- title     = {{Inverse Design of Multilayer Broadband ``RGBP'' Freeform Metalens for Dual-Functional Color-sorting and Polarization Imaging}},
- booktitle = {Conference on Lasers and Electro-Optics (CLEO)},
- month     = may,
- year      = {2025},
- url       = {https://www.merl.com/publications/TR2025-055}
- }
Masuyama, Y., Chang, X., Zhang, W., Cornell, S., Wang, Z.-Q., Ono, N., Qian, Y., Watanabe, S., "An End-to-End Integration of Speech Separation and Recognition with Self-Supervised Learning Representation", Computer Speech & Language, DOI: 10.1016/j.csl.2025.101813, Vol. 95, pp. 101813, May 2025.
BibTeX TR2025-054 PDF
- @article{Masuyama2025may,
- author  = {Masuyama, Yoshiki and Chang, Xuankai and Zhang, Wangyou and Cornell, Samuele and Wang, Zhong-Qiu and Ono, Nobutaka and Qian, Yanmin and Watanabe, Shinji},
- title   = {{An End-to-End Integration of Speech Separation and Recognition with Self-Supervised Learning Representation}},
- journal = {Computer Speech \& Language},
- volume  = {95},
- pages   = {101813},
- month   = may,
- year    = {2025},
- doi     = {10.1016/j.csl.2025.101813},
- issn    = {0885-2308},
- url     = {https://www.merl.com/publications/TR2025-054}
- }
Chen, Y., Jha, D.K., Tomizuka, M., Romeres, D., "FDPP: Fine-tune Diffusion Policy with Human Preference", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA55743.2025.11128127, May 2025.
BibTeX TR2025-053 PDF Video
- @inproceedings{Chen2025may,
- author    = {Chen, Yuxin and Jha, Devesh K. and Tomizuka, Masayoshi and Romeres, Diego},
- title     = {{FDPP: Fine-tune Diffusion Policy with Human Preference}},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
- month     = may,
- year      = {2025},
- publisher = {IEEE},
- doi       = {10.1109/ICRA55743.2025.11128127},
- isbn      = {979-8-3315-4139-2},
- url       = {https://www.merl.com/publications/TR2025-053}
- }
Shirai, Y., Raghunathan, A., Jha, D.K., "Hierarchical Contact-Rich Trajectory Optimization for Multi-Modal Manipulation using Tight Convex Relaxations", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA55743.2025.11127667, May 2025, pp. 9199-9205.
BibTeX TR2025-052 PDF
- @inproceedings{Shirai2025may,
- author    = {Shirai, Yuki and Raghunathan, Arvind and Jha, Devesh K.},
- title     = {{Hierarchical Contact-Rich Trajectory Optimization for Multi-Modal Manipulation using Tight Convex Relaxations}},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
- pages     = {9199--9205},
- month     = may,
- year      = {2025},
- doi       = {10.1109/ICRA55743.2025.11127667},
- url       = {https://www.merl.com/publications/TR2025-052}
- }
Koike-Akino, T., Tonin, F., Wu, Y., Wu, F.Z., Candogan, L.N., Cevher, V., "Quantum-PEFT: Ultra Parameter-Efficient Fine-Tuning", International Conference on Learning Representations (ICLR), April 2025.
BibTeX TR2025-051 PDF
- @inproceedings{Koike-Akino2025apr,
- author    = {Koike-Akino, Toshiaki and Tonin, Francesco and Wu, Yongtao and Wu, Frank Zhengqing and Candogan, Leyla Naz and Cevher, Volkan},
- title     = {{Quantum-PEFT: Ultra Parameter-Efficient Fine-Tuning}},
- booktitle = {International Conference on Learning Representations (ICLR)},
- month     = apr,
- year      = {2025},
- url       = {https://www.merl.com/publications/TR2025-051}
- }
Tang, H., Ellis, K., Lohit, S., Jones, M.J., Chatterjee, M., "Programmatic Video Prediction Using Large Language Models", International Conference on Learning Representations Workshops (ICLRW), April 2025.
BibTeX TR2025-049 PDF
- @inproceedings{Tang2025apr,
- author    = {Tang, Hao and Ellis, Kevin and Lohit, Suhas and Jones, Michael J. and Chatterjee, Moitreya},
- title     = {{Programmatic Video Prediction Using Large Language Models}},
- booktitle = {International Conference on Learning Representations Workshops (ICLRW)},
- month     = apr,
- year      = {2025},
- url       = {https://www.merl.com/publications/TR2025-049}
- }
Kitichotkul, R., Rapp, J., Ma, Y., Mansour, H., "Simultaneous Range and Velocity Measurement with Doppler Single-Photon Lidar", Optica, DOI: 10.1364/OPTICA.555984, Vol. 12, pp. 604-613, April 2025.
BibTeX TR2025-050 PDF
- @article{Kitichotkul2025apr,
- author  = {Kitichotkul, Ruangrawee and Rapp, Joshua and Ma, Yanting and Mansour, Hassan},
- title   = {{Simultaneous Range and Velocity Measurement with Doppler Single-Photon Lidar}},
- journal = {Optica},
- volume  = {12},
- pages   = {604--613},
- month   = apr,
- year    = {2025},
- doi     = {10.1364/OPTICA.555984},
- url     = {https://www.merl.com/publications/TR2025-050}
- }
Zhang, M., Jha, D.K., Raghunathan, A., Hauser, K., "Simultaneous Trajectory Optimization and Contact Selection for Contact-rich Manipulation with High-Fidelity Geometry", IEEE Transactions on Robotics (T-RO), DOI: 10.1109/TRO.2025.3554380, Vol. 41, pp. 2677-2690, April 2025.
BibTeX TR2025-047 PDF
- @article{Zhang2025apr,
- author  = {Zhang, Mengchao and Jha, Devesh K. and Raghunathan, Arvind and Hauser, Kris},
- title   = {{Simultaneous Trajectory Optimization and Contact Selection for Contact-rich Manipulation with High-Fidelity Geometry}},
- journal = {IEEE Transactions on Robotics (T-RO)},
- volume  = {41},
- pages   = {2677--2690},
- month   = apr,
- year    = {2025},
- doi     = {10.1109/TRO.2025.3554380},
- url     = {https://www.merl.com/publications/TR2025-047}
- }
Lin, C., Boufounos, P.T., Ma, Y., Wang, Y., Ding, Q., Sels, D., Chien, C.-C., "Time-optimal single-scalar control on a qubit of unitary dynamics", Physical Review A, DOI: 10.1103/PhysRevA.111.042602, Vol. 111, No. 4, pp. 042602, April 2025.
BibTeX TR2025-048 PDF
- @article{Lin2025apr2,
- author  = {Lin, Chungwei and Boufounos, Petros T. and Ma, Yanting and Wang, Yebin and Ding, Qi and Sels, Dries and Chien, Chih-Chun},
- title   = {{Time-optimal single-scalar control on a qubit of unitary dynamics}},
- journal = {Physical Review A},
- volume  = {111},
- number  = {4},
- pages   = {042602},
- month   = apr,
- year    = {2025},
- doi     = {10.1103/PhysRevA.111.042602},
- url     = {https://www.merl.com/publications/TR2025-048}
- }
Turcato, N., Cali, M., Dalla Libera, A., Giacomuzzo, G., Carli, R., Romeres, D., "Learning global control of underactuated double pendulum with Model-Based Reinforcement Learning", IEEE International Conference on Robotics and Automation (ICRA) - 3rd AI Olympics with RealAIGym Competition, April 2025.
BibTeX TR2025-046 PDF
- @inproceedings{Turcato2025apr,
- author    = {Turcato, Niccol{\`o} and Cali, Marco and Dalla Libera, Alberto and Giacomuzzo, Giulio and Carli, Ruggero and Romeres, Diego},
- title     = {{Learning global control of underactuated double pendulum with Model-Based Reinforcement Learning}},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA) - 3rd AI Olympics with RealAIGym Competition},
- month     = apr,
- year      = {2025},
- url       = {https://www.merl.com/publications/TR2025-046}
- }
Araki, S., Ito, N., Haeb-Umbach, R., Wichern, G., Wang, Z.-Q., Mitsufuji, Y., "30+ Years of Source Separation Research: Achievements and Future Challenges", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889006, April 2025, pp. 1-5.
BibTeX TR2025-036 PDF
- @inproceedings{Araki2025mar,
- author    = {Araki, Shoko and Ito, Nobutaka and Haeb-Umbach, Reinhold and Wichern, Gordon and Wang, Zhong-Qiu and Mitsufuji, Yuki},
- title     = {{30+ Years of Source Separation Research: Achievements and Future Challenges}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages     = {1--5},
- month     = apr,
- year      = {2025},
- doi       = {10.1109/ICASSP49660.2025.10889006},
- url       = {https://www.merl.com/publications/TR2025-036}
- }
Attiah, K., Wang, P., Mansour, H., Koike-Akino, T., Boufounos, P.T., "Enabling DMG Wi-Fi Sensing in Data Transmission Intervals by Exploiting Beam Training Codebook", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889300, April 2025.
BibTeX TR2025-026 PDF
- @inproceedings{Attiah2025mar,
- author    = {Attiah, Kareem and Wang, Pu and Mansour, Hassan and Koike-Akino, Toshiaki and Boufounos, Petros T.},
- title     = {{Enabling DMG Wi-Fi Sensing in Data Transmission Intervals by Exploiting Beam Training Codebook}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- month     = apr,
- year      = {2025},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP49660.2025.10889300},
- issn      = {2379-190X},
- isbn      = {979-8-3503-6874-1},
- url       = {https://www.merl.com/publications/TR2025-026}
- }
Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890706, April 2025.
BibTeX TR2025-037 PDF
- @inproceedings{Ebbers2025mar,
- author    = {Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
- title     = {{No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- month     = apr,
- year      = {2025},
- doi       = {10.1109/ICASSP49660.2025.10890706},
- url       = {https://www.merl.com/publications/TR2025-037}
- }
Gruttadauria, E., Fontaine, M., Le Roux, J., Essid, S., "O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890837, April 2025.
BibTeX TR2025-031 PDF
- @inproceedings{Gruttadauria2025mar,
- author    = {Gruttadauria, Elio and Fontaine, Mathieu and {Le Roux}, Jonathan and Essid, Slim},
- title     = {{{O-EENC-SD}: Efficient Online End-to-End Neural Clustering for Speaker Diarization}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- month     = apr,
- year      = {2025},
- doi       = {10.1109/ICASSP49660.2025.10890837},
- url       = {https://www.merl.com/publications/TR2025-031}
- }
Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887717, April 2025.
BibTeX TR2025-034 PDF
- @inproceedings{Hori2025mar,
- author    = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
- title     = {{Interactive Robot Action Replanning using Multimodal {LLM} Trained from Human Demonstration Videos}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- month     = apr,
- year      = {2025},
- doi       = {10.1109/ICASSP49660.2025.10887717},
- url       = {https://www.merl.com/publications/TR2025-034}
- }
Kitichotkul, R., Rapp, J., Ma, Y., Mansour, H., "Doppler Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888897, April 2025, pp. 1-5.
BibTeX TR2025-028 PDF
- @inproceedings{Kitichotkul2025mar,
- author    = {Kitichotkul, Ruangrawee and Rapp, Joshua and Ma, Yanting and Mansour, Hassan},
- title     = {{Doppler Single-Photon Lidar}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- pages     = {1--5},
- month     = apr,
- year      = {2025},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP49660.2025.10888897},
- url       = {https://www.merl.com/publications/TR2025-028}
- }
Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889481, April 2025.
BibTeX TR2025-029 PDF Software
- @inproceedings{Masuyama2025mar,
- author    = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Ick, Christopher and {Le Roux}, Jonathan},
- title     = {{Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- month     = apr,
- year      = {2025},
- doi       = {10.1109/ICASSP49660.2025.10889481},
- url       = {https://www.merl.com/publications/TR2025-029}
- }
Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888769, April 2025.
BibTeX TR2025-033 PDF
- @inproceedings{Saijo2025mar2,
- author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
- title     = {{Leveraging Audio-Only Data for Text-Queried Target Sound Extraction}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- month     = apr,
- year      = {2025},
- doi       = {10.1109/ICASSP49660.2025.10888769},
- url       = {https://www.merl.com/publications/TR2025-033}
- }