Publications

717 / 3,995 publications found.


  •  Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2025.
    BibTeX TR2025-167 PDF
    • @inproceedings{Hori2025dec,
    • author = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-167}
    • }
  •  Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
    BibTeX TR2025-162 PDF Video Data Presentation
    • @inproceedings{Xiang2025nov,
    • author = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
    • title = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-162}
    • }
  •  Masuyama, Y., "Neural Fields for Spatial Audio Modeling," Tech. Rep. TR2025-171, Speech and Audio in the Northeast (SANE), November 2025.
    BibTeX TR2025-171 PDF
    • @techreport{Masuyama2025nov,
    • author = {Masuyama, Yoshiki},
    • title = {{Neural Fields for Spatial Audio Modeling}},
    • institution = {Speech and Audio in the Northeast (SANE)},
    • number = {TR2025-171},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-171}
    • }
  •  Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), DOI: 10.5281/zenodo.17251589, October 2025, pp. 20-24.
    BibTeX TR2025-157 PDF
    • @inproceedings{Wilkinghoff2025oct,
    • author = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
    • title = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
    • booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
    • year = 2025,
    • pages = {20--24},
    • month = oct,
    • doi = {10.5281/zenodo.17251589},
    • isbn = {978-84-09-77652-8},
    • url = {https://www.merl.com/publications/TR2025-157}
    • }
  •  Chakrabarty, A., Wichern, G., Deshpande, V.M., Vinod, A.P., Berntorp, K., Laughman, C.R., "Meta-Learning for Physically-Constrained Neural System Identification", Neurocomputing, DOI: 10.1016/j.neucom.2025.130945, Vol. 651, pp. 130945, October 2025.
    BibTeX TR2025-159 PDF
    • @article{Chakrabarty2025nov,
    • author = {Chakrabarty, Ankush and Wichern, Gordon and Deshpande, Vedang M. and Vinod, Abraham P. and Berntorp, Karl and Laughman, Christopher R.},
    • title = {{Meta-Learning for Physically-Constrained Neural System Identification}},
    • journal = {Neurocomputing},
    • year = 2025,
    • volume = 651,
    • pages = 130945,
    • month = nov,
    • doi = {10.1016/j.neucom.2025.130945},
    • issn = {0925-2312},
    • url = {https://www.merl.com/publications/TR2025-159}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception", IEEE International Conference on Computer Vision (ICCV) Workshop, October 2025.
    BibTeX TR2025-154 PDF Software
    • @inproceedings{Yataka2025oct,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {{Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-154}
    • }
  •  Sun, H., Otake, Y., Matsuyama, K., Raghunathan, A., "Switchgear Partial Discharge Diagnosis Using Scarce Fault Records", IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe), DOI: 10.1109/ISGTEurope64741.2025.11305301, October 2025.
    BibTeX TR2025-155 PDF
    • @inproceedings{Sun2025oct,
    • author = {Sun, Hongbo and Otake, Yasutomo and Matsuyama, Kotaro and Raghunathan, Arvind},
    • title = {{Switchgear Partial Discharge Diagnosis Using Scarce Fault Records}},
    • booktitle = {IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/ISGTEurope64741.2025.11305301},
    • url = {https://www.merl.com/publications/TR2025-155}
    • }
  •  Piedade, V., Chitturi, S., Gaspar, J., Govindu, V., Miraldo, P., "SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-146 PDF Presentation
    • @inproceedings{Piedade2025oct,
    • author = {Piedade, Valter and Chitturi, Sidhartha and Gaspar, Jose and Govindu, Venu and Miraldo, Pedro},
    • title = {{SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-146}
    • }
  •  Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-124 PDF Video Data Presentation
    • @inproceedings{Yang2025oct,
    • author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
    • title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-124}
    • }
  •  Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
    BibTeX TR2025-149 PDF Video Presentation
    • @inproceedings{Peng2025oct,
    • author = {Peng, Kuan-Chuan},
    • title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-149}
    • }
  •  Kuwabara, A., Kirihara, H., Kato, S., Koike-Akino, T., Fujihashi, T., "L-GGSC: Learnable Graph-based Gaussian Splatting Compression", IEEE International Conference on Computer Vision Workshops (ICCV), October 2025.
    BibTeX TR2025-148 PDF
    • @inproceedings{Kuwabara2025oct,
    • author = {Kuwabara, Akihiro and Kirihara, Hinata and Kato, Sorachi and Koike-Akino, Toshiaki and Fujihashi, Takuya},
    • title = {{L-GGSC: Learnable Graph-based Gaussian Splatting Compression}},
    • booktitle = {IEEE International Conference on Computer Vision Workshops (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-148}
    • }
  •  Ma, H., Dai, B., Ren, Z., Wang, Y., Li, N., "Offline Imitation Learning upon Arbitrary Demonstrations by Pre-Training Dynamics Representations", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), October 2025.
    BibTeX TR2025-147 PDF
    • @inproceedings{Ma2025oct,
    • author = {Ma, Haitong and Dai, Bo and Ren, Zhaolin and Wang, Yebin and Li, Na},
    • title = {{Offline Imitation Learning upon Arbitrary Demonstrations by Pre-Training Dynamics Representations}},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-147}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, DOI: 10.1109/ACCESS.2025.3617284, Vol. 13, pp. 173923-173938, October 2025.
    BibTeX TR2025-145 PDF
    • @article{Shenoy2025oct,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {IEEE Access},
    • year = 2025,
    • volume = 13,
    • pages = {173923--173938},
    • month = oct,
    • doi = {10.1109/ACCESS.2025.3617284},
    • url = {https://www.merl.com/publications/TR2025-145}
    • }
  •  Masuyama, Y., Germain, F.G., Wichern, G., Ick, C., Le Roux, J., "Physics-Informed Direction-Aware Neural Acoustic Fields", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230918, October 2025.
    BibTeX TR2025-142 PDF
    • @inproceedings{Masuyama2025oct,
    • author = {Masuyama, Yoshiki and Germain, François G. and Wichern, Gordon and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{Physics-Informed Direction-Aware Neural Acoustic Fields}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/WASPAA66052.2025.11230918},
    • url = {https://www.merl.com/publications/TR2025-142}
    • }
  •  Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230943, October 2025.
    BibTeX TR2025-143 PDF
    • @inproceedings{Paissan2025oct,
    • author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, François G. and Saijo, Kohei and {Le Roux}, Jonathan},
    • title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/WASPAA66052.2025.11230943},
    • url = {https://www.merl.com/publications/TR2025-143}
    • }
  •  Ma, J., Dong, Y., Qiao, H., Laughman, C.R., "A physics-constrained deep learning framework for dynamic modeling of vapor compression systems", Applied Thermal Engineering, DOI: 10.1016/j.applthermaleng.2024.123734, Vol. 254, September 2025.
    BibTeX TR2025-137 PDF
    • @article{Ma2025sep,
    • author = {Ma, JiaCheng and Dong, Yiyun and Qiao, Hongtao and Laughman, Christopher R.},
    • title = {{A physics-constrained deep learning framework for dynamic modeling of vapor compression systems}},
    • journal = {Applied Thermal Engineering},
    • year = 2025,
    • volume = 254,
    • month = sep,
    • doi = {10.1016/j.applthermaleng.2024.123734},
    • url = {https://www.merl.com/publications/TR2025-137}
    • }
  •  Tang, W.-T., Vinod, A.P., Germain, F.G., Paulson, J.A., Laughman, C.R., Chakrabarty, A., "AI-Driven Scenario Discovery: Diffusion Models and Multi-Armed Bandits for Building Control Validation", Energy and Buildings, DOI: 10.1016/j.enbuild.2025.116207, September 2025.
    BibTeX TR2025-132 PDF
    • @article{Tang2025sep,
    • author = {Tang, Wei-Ting and Vinod, Abraham P. and Germain, François G. and Paulson, Joel A. and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {{AI-Driven Scenario Discovery: Diffusion Models and Multi-Armed Bandits for Building Control Validation}},
    • journal = {Energy and Buildings},
    • year = 2025,
    • month = sep,
    • doi = {10.1016/j.enbuild.2025.116207},
    • url = {https://www.merl.com/publications/TR2025-132}
    • }
  •  Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025, pp. 6304-6314.
    BibTeX TR2025-139 PDF
    • @inproceedings{Zhang2025sep,
    • author = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
    • title = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • pages = {6304--6314},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2025-139}
    • }
  •  Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/TGRS.2025.3604654, Vol. 63, September 2025.
    BibTeX TR2025-138 PDF
    • @article{Hu2025sep2,
    • author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
    • title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
    • journal = {IEEE Transactions on Geoscience and Remote Sensing},
    • year = 2025,
    • volume = 63,
    • month = sep,
    • doi = {10.1109/TGRS.2025.3604654},
    • issn = {1558-0644},
    • url = {https://www.merl.com/publications/TR2025-138}
    • }
  •  Miyawaki, K., Qiao, H., Sciazko, A., Shikazono, N., "LSTM-Based Modeling and Cross-Correlation Sensitivity Analysis for Heat Pump Refrigerant Distribution", International Journal of Refrigeration, DOI: 10.1016/j.ijrefrig.2025.06.006, Vol. 177, pp. 351-363, September 2025.
    BibTeX TR2025-141 PDF
    • @article{Miyawaki2025sep,
    • author = {Miyawaki, Kosuke and Qiao, Hongtao and Sciazko, Anna and Shikazono, Naoki},
    • title = {{LSTM-Based Modeling and Cross-Correlation Sensitivity Analysis for Heat Pump Refrigerant Distribution}},
    • journal = {International Journal of Refrigeration},
    • year = 2025,
    • volume = 177,
    • pages = {351--363},
    • month = sep,
    • doi = {10.1016/j.ijrefrig.2025.06.006},
    • url = {https://www.merl.com/publications/TR2025-141}
    • }
  •  Chakrabarty, A., Forgione, M., Piga, D., Bemporad, A., Laughman, C.R., "Zero-Shot Parameter Estimation of Modelica Models using Patch Transformer Networks", International Modelica and FMI Conference, September 2025.
    BibTeX TR2025-133 PDF
    • @inproceedings{Chakrabarty2025sep,
    • author = {Chakrabarty, Ankush and Forgione, Marco and Piga, Dario and Bemporad, Alberto and Laughman, Christopher R.},
    • title = {{Zero-Shot Parameter Estimation of Modelica Models using Patch Transformer Networks}},
    • booktitle = {International Modelica and FMI Conference},
    • year = 2025,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2025-133}
    • }
  •  Ji, D.-Y., Wang, B., Inoue, H., Kanemaru, M., "Simulation-to-Reality Domain Adaptation for Motor Fault Detection", IEEE International Symposium on Diagnostics for Electric Machines, Power Electronics and Drives (SDEMPED), August 2025.
    BibTeX TR2025-126 PDF
    • @inproceedings{Ji2025aug,
    • author = {Ji, Dai-Yan and Wang, Bingnan and Inoue, Hiroshi and Kanemaru, Makoto},
    • title = {{Simulation-to-Reality Domain Adaptation for Motor Fault Detection}},
    • booktitle = {IEEE International Symposium on Diagnostics for Electric Machines, Power Electronics and Drives (SDEMPED)},
    • year = 2025,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2025-126}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "End-to-End Radar Human Segmentation with Differentiable Positional Encoding", European Signal Processing Conference (EUSIPCO), DOI: 10.23919/EUSIPCO63237.2025.11226318, August 2025.
    BibTeX TR2025-125 PDF
    • @inproceedings{Yataka2025aug,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {{End-to-End Radar Human Segmentation with Differentiable Positional Encoding}},
    • booktitle = {European Signal Processing Conference (EUSIPCO)},
    • year = 2025,
    • month = aug,
    • doi = {10.23919/EUSIPCO63237.2025.11226318},
    • isbn = {978-9-4645-9362-4},
    • url = {https://www.merl.com/publications/TR2025-125}
    • }
  •  Hussein, A., Khurana, S., Wichern, G., Germain, F.G., Le Roux, J., "HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement", Interspeech, DOI: 10.21437/Interspeech.2025-2063, August 2025, pp. 5393-5397.
    BibTeX TR2025-122 PDF
    • @inproceedings{Hussein2025aug,
    • author = {Hussein, Amir and Khurana, Sameer and Wichern, Gordon and Germain, François G. and {Le Roux}, Jonathan},
    • title = {{HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement}},
    • booktitle = {Interspeech},
    • year = 2025,
    • pages = {5393--5397},
    • month = aug,
    • publisher = {ISCA},
    • doi = {10.21437/Interspeech.2025-2063},
    • url = {https://www.merl.com/publications/TR2025-122}
    • }
  •  Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses", Interspeech, DOI: 10.21437/Interspeech.2025-1912, August 2025, pp. 933-937.
    BibTeX TR2025-120 PDF
    • @inproceedings{Ick2025aug,
    • author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and {Le Roux}, Jonathan},
    • title = {{Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses}},
    • booktitle = {Interspeech},
    • year = 2025,
    • pages = {933--937},
    • month = aug,
    • doi = {10.21437/Interspeech.2025-1912},
    • url = {https://www.merl.com/publications/TR2025-120}
    • }