- Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2025.
BibTeX TR2025-167 PDF- @inproceedings{Hori2025dec,
- author    = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
- title     = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year      = {2025},
- month     = dec,
- url       = {https://www.merl.com/publications/TR2025-167}
- }
- Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
BibTeX TR2025-162 PDF Video Data Presentation- @inproceedings{Xiang2025nov,
- author    = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
- title     = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
- booktitle = {British Machine Vision Conference (BMVC)},
- year      = {2025},
- month     = nov,
- url       = {https://www.merl.com/publications/TR2025-162}
- }
- Masuyama, Y., "Neural Fields for Spatial Audio Modeling," Tech. Rep. TR2025-171, Speech and Audio in the Northeast (SANE), November 2025.
BibTeX TR2025-171 PDF- @techreport{Masuyama2025nov,
- author      = {Masuyama, Yoshiki},
- title       = {{Neural Fields for Spatial Audio Modeling}},
- institution = {Speech and Audio in the Northeast (SANE)},
- number      = {TR2025-171},
- year        = {2025},
- month       = nov,
- url         = {https://www.merl.com/publications/TR2025-171}
- }
- Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), DOI: 10.5281/zenodo.17251589, October 2025, pp. 20-24.
BibTeX TR2025-157 PDF- @inproceedings{Wilkinghoff2025oct,
- author    = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
- title     = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
- booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
- year      = {2025},
- pages     = {20--24},
- month     = oct,
- doi       = {10.5281/zenodo.17251589},
- isbn      = {978-84-09-77652-8},
- url       = {https://www.merl.com/publications/TR2025-157}
- }
- Chakrabarty, A., Wichern, G., Deshpande, V.M., Vinod, A.P., Berntorp, K., Laughman, C.R., "Meta-Learning for Physically-Constrained Neural System Identification", Neurocomputing, DOI: 10.1016/j.neucom.2025.130945, Vol. 651, pp. 130945, October 2025.
BibTeX TR2025-159 PDF- @article{Chakrabarty2025nov,
- author  = {Chakrabarty, Ankush and Wichern, Gordon and Deshpande, Vedang M. and Vinod, Abraham P. and Berntorp, Karl and Laughman, Christopher R.},
- title   = {{Meta-Learning for Physically-Constrained Neural System Identification}},
- journal = {Neurocomputing},
- year    = {2025},
- volume  = {651},
- pages   = {130945},
- month   = nov,
- doi     = {10.1016/j.neucom.2025.130945},
- issn    = {0925-2312},
- url     = {https://www.merl.com/publications/TR2025-159}
- }
- Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception", IEEE International Conference on Computer Vision (ICCV) Workshop, October 2025.
BibTeX TR2025-154 PDF Software- @inproceedings{Yataka2025oct,
- author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
- title     = {{Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop},
- year      = {2025},
- month     = oct,
- url       = {https://www.merl.com/publications/TR2025-154}
- }
- Sun, H., Otake, Y., Matsuyama, K., Raghunathan, A., "Switchgear Partial Discharge Diagnosis Using Scarce Fault Records", IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe), DOI: 10.1109/ISGTEurope64741.2025.11305301, October 2025.
BibTeX TR2025-155 PDF- @inproceedings{Sun2025oct,
- author    = {Sun, Hongbo and Otake, Yasutomo and Matsuyama, Kotaro and Raghunathan, Arvind},
- title     = {{Switchgear Partial Discharge Diagnosis Using Scarce Fault Records}},
- booktitle = {IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe)},
- year      = {2025},
- month     = oct,
- doi       = {10.1109/ISGTEurope64741.2025.11305301},
- url       = {https://www.merl.com/publications/TR2025-155}
- }
- Piedade, V., Chitturi, S., Gaspar, J., Govindu, V., Miraldo, P., "SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity", IEEE International Conference on Computer Vision (ICCV), October 2025.
BibTeX TR2025-146 PDF Presentation- @inproceedings{Piedade2025oct,
- author    = {Piedade, Valter and Chitturi, Sidhartha and Gaspar, Jose and Govindu, Venu and Miraldo, Pedro},
- title     = {{SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year      = {2025},
- month     = oct,
- url       = {https://www.merl.com/publications/TR2025-146}
- }
- Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
BibTeX TR2025-124 PDF Video Data Presentation- @inproceedings{Yang2025oct,
- author    = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
- title     = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year      = {2025},
- month     = oct,
- url       = {https://www.merl.com/publications/TR2025-124}
- }
- Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
BibTeX TR2025-149 PDF Video Presentation- @inproceedings{Peng2025oct,
- author    = {Peng, Kuan-Chuan},
- title     = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
- year      = {2025},
- month     = oct,
- url       = {https://www.merl.com/publications/TR2025-149}
- }
- Kuwabara, A., Kirihara, H., Kato, S., Koike-Akino, T., Fujihashi, T., "L-GGSC: Learnable Graph-based Gaussian Splatting Compression", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
BibTeX TR2025-148 PDF- @inproceedings{Kuwabara2025oct,
- author    = {Kuwabara, Akihiro and Kirihara, Hinata and Kato, Sorachi and Koike-Akino, Toshiaki and Fujihashi, Takuya},
- title     = {{L-GGSC: Learnable Graph-based Gaussian Splatting Compression}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
- year      = {2025},
- month     = oct,
- url       = {https://www.merl.com/publications/TR2025-148}
- }
- Ma, H., Dai, B., Ren, Z., Wang, Y., Li, N., "Offline Imitation Learning upon Arbitrary Demonstrations by Pre-Training Dynamics Representations", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), October 2025.
BibTeX TR2025-147 PDF- @inproceedings{Ma2025oct,
- author    = {Ma, Haitong and Dai, Bo and Ren, Zhaolin and Wang, Yebin and Li, Na},
- title     = {{Offline Imitation Learning upon Arbitrary Demonstrations by Pre-Training Dynamics Representations}},
- booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
- year      = {2025},
- month     = oct,
- url       = {https://www.merl.com/publications/TR2025-147}
- }
- Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, DOI: 10.1109/ACCESS.2025.3617284, Vol. 13, pp. 173923-173938, October 2025.
BibTeX TR2025-145 PDF- @article{Shenoy2025oct,
- author  = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
- title   = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
- journal = {IEEE Access},
- year    = {2025},
- volume  = {13},
- pages   = {173923--173938},
- month   = oct,
- doi     = {10.1109/ACCESS.2025.3617284},
- url     = {https://www.merl.com/publications/TR2025-145}
- }
- Masuyama, Y., Germain, F.G., Wichern, G., Ick, C., Le Roux, J., "Physics-Informed Direction-Aware Neural Acoustic Fields", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230918, October 2025.
BibTeX TR2025-142 PDF- @inproceedings{Masuyama2025oct,
- author    = {Masuyama, Yoshiki and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and Ick, Christopher and {Le Roux}, Jonathan},
- title     = {{Physics-Informed Direction-Aware Neural Acoustic Fields}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year      = {2025},
- month     = oct,
- doi       = {10.1109/WASPAA66052.2025.11230918},
- url       = {https://www.merl.com/publications/TR2025-142}
- }
- Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230943, October 2025.
BibTeX TR2025-143 PDF- @inproceedings{Paissan2025oct,
- author    = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, Fran{\c{c}}ois G. and Saijo, Kohei and {Le Roux}, Jonathan},
- title     = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year      = {2025},
- month     = oct,
- doi       = {10.1109/WASPAA66052.2025.11230943},
- url       = {https://www.merl.com/publications/TR2025-143}
- }
- Ma, J., Dong, Y., Qiao, H., Laughman, C.R., "A physics-constrained deep learning framework for dynamic modeling of vapor compression systems", Applied Thermal Engineering, DOI: 10.1016/j.applthermaleng.2024.123734, Vol. 254, September 2025.
BibTeX TR2025-137 PDF- @article{Ma2025sep,
- author  = {Ma, JiaCheng and Dong, Yiyun and Qiao, Hongtao and Laughman, Christopher R.},
- title   = {{A physics-constrained deep learning framework for dynamic modeling of vapor compression systems}},
- journal = {Applied Thermal Engineering},
- year    = {2025},
- volume  = {254},
- month   = sep,
- doi     = {10.1016/j.applthermaleng.2024.123734},
- url     = {https://www.merl.com/publications/TR2025-137}
- }
- Tang, W.-T., Vinod, A.P., Germain, F.G., Paulson, J.A., Laughman, C.R., Chakrabarty, A., "AI-Driven Scenario Discovery: Diffusion Models and Multi-Armed Bandits for Building Control Validation", Energy and Buildings, DOI: 10.1016/j.enbuild.2025.116207, September 2025.
BibTeX TR2025-132 PDF- @article{Tang2025sep,
- author  = {Tang, Wei-Ting and Vinod, Abraham P. and Germain, Fran{\c{c}}ois G. and Paulson, Joel A. and Laughman, Christopher R. and Chakrabarty, Ankush},
- title   = {{AI-Driven Scenario Discovery: Diffusion Models and Multi-Armed Bandits for Building Control Validation}},
- journal = {Energy and Buildings},
- year    = {2025},
- month   = sep,
- doi     = {10.1016/j.enbuild.2025.116207},
- url     = {https://www.merl.com/publications/TR2025-132}
- }
- Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025, pp. 6304-6314.
BibTeX TR2025-139 PDF- @inproceedings{Zhang2025sep,
- author    = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
- title     = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year      = {2025},
- pages     = {6304--6314},
- month     = sep,
- url       = {https://www.merl.com/publications/TR2025-139}
- }
- Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/TGRS.2025.3604654, Vol. 63, September 2025.
BibTeX TR2025-138 PDF- @article{Hu2025sep2,
- author  = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
- title   = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
- journal = {IEEE Transactions on Geoscience and Remote Sensing},
- year    = {2025},
- volume  = {63},
- month   = sep,
- doi     = {10.1109/TGRS.2025.3604654},
- issn    = {1558-0644},
- url     = {https://www.merl.com/publications/TR2025-138}
- }
- Miyawaki, K., Qiao, H., Sciazko, A., Shikazono, N., "LSTM-Based Modeling and Cross-Correlation Sensitivity Analysis for Heat Pump Refrigerant Distribution", International Journal of Refrigeration, DOI: 10.1016/j.ijrefrig.2025.06.006, Vol. 177, pp. 351-363, September 2025.
BibTeX TR2025-141 PDF- @article{Miyawaki2025sep,
- author  = {Miyawaki, Kosuke and Qiao, Hongtao and Sciazko, Anna and Shikazono, Naoki},
- title   = {{LSTM-Based Modeling and Cross-Correlation Sensitivity Analysis for Heat Pump Refrigerant Distribution}},
- journal = {International Journal of Refrigeration},
- year    = {2025},
- volume  = {177},
- pages   = {351--363},
- month   = sep,
- doi     = {10.1016/j.ijrefrig.2025.06.006},
- url     = {https://www.merl.com/publications/TR2025-141}
- }
- Chakrabarty, A., Forgione, M., Piga, D., Bemporad, A., Laughman, C.R., "Zero-Shot Parameter Estimation of Modelica Models using Patch Transformer Networks", International Modelica and FMI Conference, September 2025.
BibTeX TR2025-133 PDF- @inproceedings{Chakrabarty2025sep,
- author    = {Chakrabarty, Ankush and Forgione, Marco and Piga, Dario and Bemporad, Alberto and Laughman, Christopher R.},
- title     = {{Zero-Shot Parameter Estimation of Modelica Models using Patch Transformer Networks}},
- booktitle = {International Modelica and FMI Conference},
- year      = {2025},
- month     = sep,
- url       = {https://www.merl.com/publications/TR2025-133}
- }
- Ji, D.-Y., Wang, B., Inoue, H., Kanemaru, M., "Simulation-to-Reality Domain Adaptation for Motor Fault Detection", IEEE International Symposium on Diagnostics for Electric Machines, Power Electronics and Drives (SDEMPED), August 2025.
BibTeX TR2025-126 PDF- @inproceedings{Ji2025aug,
- author    = {Ji, Dai-Yan and Wang, Bingnan and Inoue, Hiroshi and Kanemaru, Makoto},
- title     = {{Simulation-to-Reality Domain Adaptation for Motor Fault Detection}},
- booktitle = {IEEE International Symposium on Diagnostics for Electric Machines, Power Electronics and Drives (SDEMPED)},
- year      = {2025},
- month     = aug,
- url       = {https://www.merl.com/publications/TR2025-126}
- }
- Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "End-to-End Radar Human Segmentation with Differentiable Positional Encoding", European Signal Processing Conference (EUSIPCO), DOI: 10.23919/EUSIPCO63237.2025.11226318, August 2025.
BibTeX TR2025-125 PDF- @inproceedings{Yataka2025aug,
- author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
- title     = {{End-to-End Radar Human Segmentation with Differentiable Positional Encoding}},
- booktitle = {European Signal Processing Conference (EUSIPCO)},
- year      = {2025},
- month     = aug,
- doi       = {10.23919/EUSIPCO63237.2025.11226318},
- isbn      = {978-9-4645-9362-4},
- url       = {https://www.merl.com/publications/TR2025-125}
- }
- Hussein, A., Khurana, S., Wichern, G., Germain, F.G., Le Roux, J., "HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement", Interspeech, DOI: 10.21437/Interspeech.2025-2063, August 2025, pp. 5393-5397.
BibTeX TR2025-122 PDF- @inproceedings{Hussein2025aug,
- author    = {Hussein, Amir and Khurana, Sameer and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
- title     = {{HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement}},
- booktitle = {Interspeech},
- year      = {2025},
- pages     = {5393--5397},
- month     = aug,
- publisher = {ISCA},
- doi       = {10.21437/Interspeech.2025-2063},
- url       = {https://www.merl.com/publications/TR2025-122}
- }
- Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses", Interspeech, DOI: 10.21437/Interspeech.2025-1912, August 2025, pp. 933-937.
BibTeX TR2025-120 PDF- @inproceedings{Ick2025aug,
- author    = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
- title     = {{Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses}},
- booktitle = {Interspeech},
- year      = {2025},
- pages     = {933--937},
- month     = aug,
- doi       = {10.21437/Interspeech.2025-1912},
- url       = {https://www.merl.com/publications/TR2025-120}
- }