Publications

699 / 3,956 publications found.


  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Local Density-Based Anomaly Score Normalization for Domain Generalization", IEEE Transactions on Audio, Speech and Language Processing, January 2026.
    BibTeX TR2026-010 PDF Software
    • @article{Wilkinghoff2026jan,
    • author = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, François G and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Local Density-Based Anomaly Score Normalization for Domain Generalization}},
    • journal = {IEEE Transactions on Audio, Speech and Language Processing},
    • year = 2026,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2026-010}
    • }
  •  Cornell, S., Boeddeker, C., Park, T., Huang, H., Raj, D., Wiesner, M., Masuyama, Y., Chang, X., Wang, Z.-Q., Squartini, S., Garcia, P., Watanabe, S., "Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges", Computer Speech & Language, December 2025.
    BibTeX TR2026-008 PDF
    • @article{Cornell2025dec,
    • author = {Cornell, Samuele and Boeddeker, Christoph and Park, Taejin and Huang, He and Raj, Desh and Wiesner, Matthew and Masuyama, Yoshiki and Chang, Xuankai and Wang, Zhong-Qiu and Squartini, Stefano and Garcia, Paola and Watanabe, Shinji},
    • title = {{Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges}},
    • journal = {Computer Speech \& Language},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2026-008}
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "SuDaField: Subject- and Dataset-Aware Neural Field for HRTF Modeling", IEEE Open Journal of Signal Processing, December 2025.
    BibTeX TR2026-009 PDF
    • @article{Masuyama2025dec2,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{SuDaField: Subject- and Dataset-Aware Neural Field for HRTF Modeling}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2026-009}
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "RANF: Neural Field-Based HRTF Spatial Upsampling with Retrieval Augmentation and Parameter Efficient Fine-Tuning", IEEE Open Journal of Signal Processing, December 2025.
    BibTeX TR2026-007 PDF Software
    • @article{Masuyama2025dec,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{RANF: Neural Field-Based HRTF Spatial Upsampling with Retrieval Augmentation and Parameter Efficient Fine-Tuning}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2026-007}
    • }
  •  Kato, S., Yataka, R., Wang, P., Miraldo, P., Fujihashi, T., Boufounos, P.T., "RAPTR: Radar-based 3D Pose Estimation using Transformer", Advances in Neural Information Processing Systems (NeurIPS), December 2025.
    BibTeX TR2026-006 PDF Software
    • @inproceedings{Kato2025dec,
    • author = {Kato, Sorachi and Yataka, Ryoma and Wang, Pu and Miraldo, Pedro and Fujihashi, Takuya and Boufounos, Petros T.},
    • title = {{RAPTR: Radar-based 3D Pose Estimation using Transformer}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2026-006}
    • }
  •  Hutchinson, S., Vinod, A.P., Germain, F.G., Di Cairano, S., Laughman, C.R., Chakrabarty, A., "Quantile-SMPC for Grid-Interactive Buildings with Multivariate Temporal Fusion Transformers", Advances in Neural Information Processing Systems (NeurIPS) Workshop on UrbanAI, December 2025.
    BibTeX TR2026-001 PDF
    • @inproceedings{Hutchinson2025dec,
    • author = {Hutchinson, Spencer and Vinod, Abraham P. and Germain, François G and Di Cairano, Stefano and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {{Quantile-SMPC for Grid-Interactive Buildings with Multivariate Temporal Fusion Transformers}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) Workshop on UrbanAI},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2026-001}
    • }
  •  Xie, X., Mowlavi, S., Benosman, M., "Smooth and Sparse Latent Dynamics in Operator Learning with Jerk Regularization", Advances in Neural Information Processing Systems (NeurIPS) workshop on Machine Learning and the Physical Sciences (ML4PS), December 2025.
    BibTeX TR2025-166 PDF
    • @inproceedings{Xie2025dec,
    • author = {Xie, Xiaoyu and Mowlavi, Saviz and Benosman, Mouhacine},
    • title = {{Smooth and Sparse Latent Dynamics in Operator Learning with Jerk Regularization}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) workshop on Machine Learning and the Physical Sciences (ML4PS)},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-166}
    • }
  •  Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2025.
    BibTeX TR2025-167 PDF
    • @inproceedings{Hori2025dec,
    • author = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-167}
    • }
  •  Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
    BibTeX TR2025-162 PDF Video Data Presentation
    • @inproceedings{Xiang2025nov,
    • author = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
    • title = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-162}
    • }
  •  Masuyama, Y., "Neural Fields for Spatial Audio Modeling," Tech. Rep. TR2025-171, Speech and Audio in the Northeast (SANE), November 2025.
    BibTeX TR2025-171 PDF
    • @techreport{Masuyama2025nov,
    • author = {Masuyama, Yoshiki},
    • title = {{Neural Fields for Spatial Audio Modeling}},
    • institution = {Speech and Audio in the Northeast (SANE)},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-171}
    • }
  •  Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), DOI: 10.5281/zenodo.17251589, October 2025, pp. 20-24.
    BibTeX TR2025-157 PDF
    • @inproceedings{Wilkinghoff2025oct,
    • author = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
    • title = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
    • booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
    • year = 2025,
    • pages = {20--24},
    • month = oct,
    • doi = {10.5281/zenodo.17251589},
    • isbn = {978-84-09-77652-8},
    • url = {https://www.merl.com/publications/TR2025-157}
    • }
  •  Chakrabarty, A., Wichern, G., Deshpande, V.M., Vinod, A.P., Berntorp, K., Laughman, C.R., "Meta-Learning for Physically-Constrained Neural System Identification", Neurocomputing, DOI: 10.1016/j.neucom.2025.130945, Vol. 651, pp. 130945, October 2025.
    BibTeX TR2025-159 PDF
    • @article{Chakrabarty2025nov,
    • author = {Chakrabarty, Ankush and Wichern, Gordon and Deshpande, Vedang M. and Vinod, Abraham P. and Berntorp, Karl and Laughman, Christopher R.},
    • title = {{Meta-Learning for Physically-Constrained Neural System Identification}},
    • journal = {Neurocomputing},
    • year = 2025,
    • volume = 651,
    • pages = 130945,
    • month = oct,
    • doi = {10.1016/j.neucom.2025.130945},
    • issn = {0925-2312},
    • url = {https://www.merl.com/publications/TR2025-159}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception", IEEE International Conference on Computer Vision (ICCV) Workshop, October 2025.
    BibTeX TR2025-154 PDF
    • @inproceedings{Yataka2025oct,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {{Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-154}
    • }
  •  Sun, H., Otake, Y., Matsuyama, K., Raghunathan, A., "Switchgear Partial Discharge Diagnosis Using Scarce Fault Records", IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe), October 2025.
    BibTeX TR2025-155 PDF
    • @inproceedings{Sun2025oct,
    • author = {Sun, Hongbo and Otake, Yasutomo and Matsuyama, Kotaro and Raghunathan, Arvind},
    • title = {{Switchgear Partial Discharge Diagnosis Using Scarce Fault Records}},
    • booktitle = {IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-155}
    • }
  •  Piedade, V., Chitturi, S., Gaspar, J., Govindu, V., Miraldo, P., "SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-146 PDF Presentation
    • @inproceedings{Piedade2025oct,
    • author = {Piedade, Valter and Chitturi, Sidhartha and Gaspar, Jose and Govindu, Venu and Miraldo, Pedro},
    • title = {{SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-146}
    • }
  •  Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-124 PDF Video Data Presentation
    • @inproceedings{Yang2025oct,
    • author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
    • title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-124}
    • }
  •  Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
    BibTeX TR2025-149 PDF Video Presentation
    • @inproceedings{Peng2025oct,
    • author = {Peng, Kuan-Chuan},
    • title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-149}
    • }
  •  Kuwabara, A., Kirihara, H., Kato, S., Koike-Akino, T., Fujihashi, T., "L-GGSC: Learnable Graph-based Gaussian Splatting Compression", IEEE International Conference on Computer Vision Workshops (ICCV), October 2025.
    BibTeX TR2025-148 PDF
    • @inproceedings{Kuwabara2025oct,
    • author = {Kuwabara, Akihiro and Kirihara, Hinata and Kato, Sorachi and Koike-Akino, Toshiaki and Fujihashi, Takuya},
    • title = {{L-GGSC: Learnable Graph-based Gaussian Splatting Compression}},
    • booktitle = {IEEE International Conference on Computer Vision Workshops (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-148}
    • }
  •  Ma, H., Dai, B., Ren, Z., Wang, Y., Li, N., "Offline Imitation Learning upon Arbitrary Demonstrations by Pre-Training Dynamics Representations", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), October 2025.
    BibTeX TR2025-147 PDF
    • @inproceedings{Ma2025oct,
    • author = {Ma, Haitong and Dai, Bo and Ren, Zhaolin and Wang, Yebin and Li, Na},
    • title = {{Offline Imitation Learning upon Arbitrary Demonstrations by Pre-Training Dynamics Representations}},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-147}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, October 2025.
    BibTeX TR2025-145 PDF
    • @article{Shenoy2025oct,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {IEEE Access},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-145}
    • }
  •  Masuyama, Y., Germain, F.G., Wichern, G., Ick, C., Le Roux, J., "Physics-Informed Direction-Aware Neural Acoustic Fields", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230918, October 2025.
    BibTeX TR2025-142 PDF
    • @inproceedings{Masuyama2025oct,
    • author = {Masuyama, Yoshiki and Germain, François G and Wichern, Gordon and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{Physics-Informed Direction-Aware Neural Acoustic Fields}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/WASPAA66052.2025.11230918},
    • url = {https://www.merl.com/publications/TR2025-142}
    • }
  •  Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230943, October 2025.
    BibTeX TR2025-143 PDF
    • @inproceedings{Paissan2025oct,
    • author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, François G and Saijo, Kohei and {Le Roux}, Jonathan},
    • title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/WASPAA66052.2025.11230943},
    • url = {https://www.merl.com/publications/TR2025-143}
    • }
  •  Ma, J., Dong, Y., Qiao, H., Laughman, C.R., "A physics-constrained deep learning framework for dynamic modeling of vapor compression systems", Applied Energy, September 2025.
    BibTeX TR2025-137 PDF
    • @article{Ma2025sep,
    • author = {Ma, JiaCheng and Dong, Yiyun and Qiao, Hongtao and Laughman, Christopher R.},
    • title = {{A physics-constrained deep learning framework for dynamic modeling of vapor compression systems}},
    • journal = {Applied Energy},
    • year = 2025,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2025-137}
    • }
  •  Tang, W.-T., Vinod, A.P., Germain, F.G., Paulson, J.A., Laughman, C.R., Chakrabarty, A., "AI-Driven Scenario Discovery: Diffusion Models and Multi-Armed Bandits for Building Control Validation", Energy and Buildings, DOI: 10.1016/j.enbuild.2025.116207, September 2025.
    BibTeX TR2025-132 PDF
    • @article{Tang2025sep,
    • author = {Tang, Wei-Ting and Vinod, Abraham P. and Germain, François G and Paulson, Joel A. and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {{AI-Driven Scenario Discovery: Diffusion Models and Multi-Armed Bandits for Building Control Validation}},
    • journal = {Energy and Buildings},
    • year = 2025,
    • month = sep,
    • doi = {10.1016/j.enbuild.2025.116207},
    • url = {https://www.merl.com/publications/TR2025-132}
    • }
  •  Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025, pp. 6304-6314.
    BibTeX TR2025-139 PDF
    • @inproceedings{Zhang2025sep,
    • author = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
    • title = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • pages = {6304--6314},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2025-139}
    • }