Publications

Cherian, A., Lohit, S., Peng, K.-C., "WISE: Weighted Iterative Society-of-Experts for Multimodal Multi-Agent Debate with Probabilistic Consensus", ICML SCALE AI Workshop, June 2026.
BibTeX TR2026-083 PDF
- @inproceedings{Cherian2026jun,
-   author    = {Cherian, Anoop and Lohit, Suhas and Peng, Kuan-Chuan},
-   title     = {{WISE: Weighted Iterative Society-of-Experts for Multimodal Multi-Agent Debate with Probabilistic Consensus}},
-   booktitle = {ICML SCALE AI Workshop},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-083},
- }
Zhou, Q., Gan, C., Cherian, A., "LLawCo: Learning Laws of Cooperation for Modeling Embodied Multi-Agent Behavior", International Conference on Machine Learning (ICML), June 2026.
BibTeX TR2026-081 PDF Video
- @inproceedings{Zhou2026jun,
-   author    = {Zhou, Qinhong and Gan, Chuang and Cherian, Anoop},
-   title     = {{LLawCo: Learning Laws of Cooperation for Modeling Embodied Multi-Agent Behavior}},
-   booktitle = {International Conference on Machine Learning (ICML)},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-081},
- }
Hsieh, J.-W., Wu, Y.-H., Hsieh, Y.-K., Li, X., Peng, K.-C., Chang, M.-C., "SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification", CVPR Findings, June 2026.
BibTeX TR2026-075 PDF
- @inproceedings{Hsieh2026jun2,
-   author    = {Hsieh, Jun-Wei and Wu, Ying-Hsuan and Hsieh, Yi-Kuan and Li, Xin and Peng, Kuan-Chuan and Chang, Ming-Ching},
-   title     = {{SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification}},
-   booktitle = {CVPR Findings},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-075},
- }
Hsieh, J.-W., Wu, Y.-H., Hsieh, Y.-K., Li, X., Peng, K.-C., Chang, M.-C., "SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification Supplementary Material", CVPR Findings, June 2026.
BibTeX TR2026-074 PDF
- @inproceedings{Hsieh2026jun,
-   author    = {Hsieh, Jun-Wei and Wu, Ying-Hsuan and Hsieh, Yi-Kuan and Li, Xin and Peng, Kuan-Chuan and Chang, Ming-Ching},
-   title     = {{SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification Supplementary Material}},
-   booktitle = {CVPR Findings},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-074},
- }
Li, D., Zhang, J., Egger, B., Chatterjee, M., Lohit, S., Marks, T.K., Cherian, A., "AssemblyBench: Physics-Aware Assembly of Complex Industrial Objects", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2026.
BibTeX TR2026-076 PDF Video Data Software
- @inproceedings{Li2026jun,
-   author    = {Li, Danrui and Zhang, Jiahao and Egger, Bernhard and Chatterjee, Moitreya and Lohit, Suhas and Marks, Tim K. and Cherian, Anoop},
-   title     = {{AssemblyBench: Physics-Aware Assembly of Complex Industrial Objects}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-076},
- }
Liu, X., Miraldo, P., Lohit, S., Jiang, H., Sawada, N., Tai, Y.-W., Tang, C.-K., Chatterjee, M., "Point4Cast: Streaming Dynamic Scene Reconstruction and Forecasting", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2026.
BibTeX TR2026-077 PDF
- @inproceedings{Liu2026jun,
-   author    = {Liu, Xinhang and Miraldo, Pedro and Lohit, Suhas and Jiang, Huaizu and Sawada, Naoko and Tai, Yu-Wing and Tang, Chi-Keung and Chatterjee, Moitreya},
-   title     = {{Point4Cast: Streaming Dynamic Scene Reconstruction and Forecasting}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-077},
- }
Jain, S., Choi, H.J., "SplatCtrl: Perception–Action Coupling via Gaussian Scene Representations and Reactive Robot Control", 2026 IEEE International Conference on Robotics & Automation (ICRA), June 2026.
BibTeX TR2026-069 PDF
- @inproceedings{Jain2026jun,
-   author    = {Jain, Siddarth and Choi, Ho Jin},
-   title     = {{SplatCtrl: Perception--Action Coupling via Gaussian Scene Representations and Reactive Robot Control}},
-   booktitle = {2026 IEEE International Conference on Robotics \& Automation (ICRA)},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-069},
- }
Velentzas, I.G., Tomita, K., "LIDIA: Localizing In the Dark with Illumination-Awareness toward Perception-Aware Planning", IEEE International Conference on Robotics and Automation (ICRA), June 2026.
BibTeX TR2026-071 PDF
- @inproceedings{Velentzas2026jun,
-   author    = {Velentzas, I. G. and Tomita, K.},
-   title     = {{LIDIA: Localizing In the Dark with Illumination-Awareness toward Perception-Aware Planning}},
-   booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
-   year      = {2026},
-   month     = jun,
-   url       = {https://www.merl.com/publications/TR2026-071},
- }
Ding, T., Xie, Y., Liang, Y., Chatterjee, M., Miraldo, P., Jiang, H., "LASER: Layer-wise Scale Alignment for Training-Free Streaming 4D Reconstruction", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2026.
BibTeX TR2026-055 PDF
- @inproceedings{Ding2026may,
-   author    = {Ding, Tianye and Xie, Yiming and Liang, Yiqing and Chatterjee, Moitreya and Miraldo, Pedro and Jiang, Huaizu},
-   title     = {{LASER: Layer-wise Scale Alignment for Training-Free Streaming 4D Reconstruction}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   year      = {2026},
-   month     = may,
-   url       = {https://www.merl.com/publications/TR2026-055},
- }
Manam, L., Govindu, V., "Parallel Rigidity Matters for Bundle Adjustment", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2026, pp. 29035-29046.
BibTeX TR2026-053 PDF Video Presentation
- @inproceedings{Lalit2026may,
-   author    = {Manam, Lalit and Govindu, Venu},
-   title     = {{Parallel Rigidity Matters for Bundle Adjustment}},
-   booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
-   year      = {2026},
-   pages     = {29035--29046},
-   month     = may,
-   url       = {https://www.merl.com/publications/TR2026-053},
- }
Piedade, V., Manam, L., Yamazaki, M., Miraldo, P., "Revisiting Monocular SLAM with Spatio-Temporal Scene Modeling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2026.
BibTeX TR2026-056 PDF Video Software Presentation
- @inproceedings{Piedade2026may,
-   author    = {Piedade, Valter and Manam, Lalit and Yamazaki, Masashi and Miraldo, Pedro},
-   title     = {{Revisiting Monocular SLAM with Spatio-Temporal Scene Modeling}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   year      = {2026},
-   month     = may,
-   url       = {https://www.merl.com/publications/TR2026-056},
- }
Cherian, A., Corcodel, R., Jain, S., Romeres, D., "LLMPhy: Parameter-Identifiable Physical Reasoning Combining Large Language Models and Physics Engines", International Conference on Artificial Intelligence and Statistics (AISTATS), May 2026.
BibTeX TR2026-052 PDF Data Software
- @inproceedings{Cherian2026may,
-   author    = {Cherian, Anoop and Corcodel, Radu and Jain, Siddarth and Romeres, Diego},
-   title     = {{LLMPhy: Parameter-Identifiable Physical Reasoning Combining Large Language Models and Physics Engines}},
-   booktitle = {International Conference on Artificial Intelligence and Statistics (AISTATS)},
-   year      = {2026},
-   month     = may,
-   url       = {https://www.merl.com/publications/TR2026-052},
- }
Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", IEEE Transactions on Image Processing, DOI: 10.1109/TIP.2026.3671653, Vol. 35, pp. 2755-2770, March 2026.
BibTeX TR2026-031 PDF
- @article{Shenoy2026mar,
-   author  = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
-   title   = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
-   journal = {IEEE Transactions on Image Processing},
-   year    = {2026},
-   volume  = {35},
-   pages   = {2755--2770},
-   month   = mar,
-   doi     = {10.1109/TIP.2026.3671653},
-   issn    = {1941-0042},
-   url     = {https://www.merl.com/publications/TR2026-031},
- }
Kogashi, K., Cherian, A., Kuo, M.-Y.J., "MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions", IEEE Winter Conference on Applications of Computer Vision (WACV), March 2026, pp. 1512-1521.
BibTeX TR2026-029 PDF Video Data
- @inproceedings{Kogashi2026mar,
-   author    = {Kogashi, Kaen and Cherian, Anoop and Kuo, Meng-Yu Jennifer},
-   title     = {{MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions}},
-   booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
-   year      = {2026},
-   pages     = {1512--1521},
-   month     = mar,
-   url       = {https://www.merl.com/publications/TR2026-029},
- }
Mumcu, F., Jones, M.J., Yilmaz, Y., Cherian, A., "Leveraging Multimodal LLM Descriptions of Activity for Explainable Semi-Supervised Video Anomaly Detection", Transactions on Machine Learning Research, February 2026.
BibTeX TR2026-027 PDF
- @article{Mumcu2026feb2,
-   author  = {Mumcu, Furkan and Jones, Michael J. and Yilmaz, Yasin and Cherian, Anoop},
-   title   = {{Leveraging Multimodal LLM Descriptions of Activity for Explainable Semi-Supervised Video Anomaly Detection}},
-   journal = {Transactions on Machine Learning Research},
-   year    = {2026},
-   month   = feb,
-   url     = {https://www.merl.com/publications/TR2026-027},
- }
Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Indoor Multi-View Radar Object Detection via 3D Bounding Box Diffusion", AAAI Conference on Artificial Intelligence, DOI: 10.1609/aaai.v40i22.38939, January 2026, vol. 40, pp. 18710-18718.
BibTeX TR2026-019 PDF Software
- @inproceedings{Yataka2026jan,
-   author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
-   title     = {{Indoor Multi-View Radar Object Detection via 3D Bounding Box Diffusion}},
-   booktitle = {AAAI Conference on Artificial Intelligence},
-   year      = {2026},
-   volume    = {40},
-   number    = {22},
-   pages     = {18710--18718},
-   month     = jan,
-   doi       = {10.1609/aaai.v40i22.38939},
-   url       = {https://www.merl.com/publications/TR2026-019},
- }
Kuwabara, A., Kato, S., Koike-Akino, T., Fujihashi, T., "Range Image-Based Implicit Neural Compression for LiDAR Point Clouds", IEEE Access, DOI: 10.1109/ACCESS.2026.3654068, Vol. 14, pp. 10262-10275, January 2026.
BibTeX TR2026-023 PDF
- @article{Kuwabara2026feb,
-   author  = {Kuwabara, Akihiro and Kato, Sorachi and Koike-Akino, Toshiaki and Fujihashi, Takuya},
-   title   = {{Range Image-Based Implicit Neural Compression for LiDAR Point Clouds}},
-   journal = {IEEE Access},
-   year    = {2026},
-   volume  = {14},
-   pages   = {10262--10275},
-   month   = feb,
-   doi     = {10.1109/ACCESS.2026.3654068},
-   issn    = {2169-3536},
-   url     = {https://www.merl.com/publications/TR2026-023},
- }
Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU65441.2025.11434641, December 2025.
BibTeX TR2025-167 PDF
- @inproceedings{Hori2025dec,
-   author    = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
-   title     = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
-   booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
-   year      = {2025},
-   month     = dec,
-   doi       = {10.1109/ASRU65441.2025.11434641},
-   issn      = {2997-6995},
-   isbn      = {979-8-3315-4426-3},
-   url       = {https://www.merl.com/publications/TR2025-167},
- }
Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
BibTeX TR2025-162 PDF Video Data Presentation
- @inproceedings{Xiang2025nov,
-   author    = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
-   title     = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
-   booktitle = {British Machine Vision Conference (BMVC)},
-   year      = {2025},
-   month     = nov,
-   url       = {https://www.merl.com/publications/TR2025-162},
- }
Gambill, P., Jha, D.K., Krishnamoorthy, B., Raghunathan, A., Yerazunis, W.S., "DamageEst: Accurate Estimation of Damage for Repair using Additive Manufacturing", Solid Freeform Fabrication Symposium (SFF), November 2025, pp. 1506-1526.
BibTeX TR2025-158 PDF Presentation
- @inproceedings{Gambill2025nov,
-   author    = {Gambill, Patrick and Jha, Devesh K. and Krishnamoorthy, Bala and Raghunathan, Arvind and Yerazunis, William S.},
-   title     = {{DamageEst: Accurate Estimation of Damage for Repair using Additive Manufacturing}},
-   booktitle = {36th Annual International Solid Freeform Fabrication Symposium -- An Additive Manufacturing Conference},
-   year      = {2025},
-   pages     = {1506--1526},
-   month     = nov,
-   url       = {https://www.merl.com/publications/TR2025-158},
- }
Nikovski, D.N., "Observation-Based Inverse Kinematics for Visual Servo Control", 22nd International Conference on Informatics in Control, Automation and Robotics (ICINCO), DOI: 10.5220/0013701100003982, October 2025, pp. 200-207.
BibTeX TR2025-153 PDF
- @inproceedings{Nikovski2025oct,
-   author    = {Nikovski, Daniel N.},
-   title     = {{Observation-Based Inverse Kinematics for Visual Servo Control}},
-   booktitle = {22nd International Conference on Informatics in Control, Automation and Robotics (ICINCO)},
-   year      = {2025},
-   pages     = {200--207},
-   month     = oct,
-   publisher = {SciTePress},
-   doi       = {10.5220/0013701100003982},
-   isbn      = {978-989-758-770-2},
-   url       = {https://www.merl.com/publications/TR2025-153},
- }
Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception", IEEE International Conference on Computer Vision (ICCV) Workshop, October 2025.
BibTeX TR2025-154 PDF Software
- @inproceedings{Yataka2025oct,
-   author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
-   title     = {{Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception}},
-   booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop},
-   year      = {2025},
-   month     = oct,
-   url       = {https://www.merl.com/publications/TR2025-154},
- }
Piedade, V., Chitturi, S., Gaspar, J., Govindu, V., Miraldo, P., "SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity", IEEE International Conference on Computer Vision (ICCV), DOI: 10.1109/ICCV51701.2025.00547, October 2025, pp. 5780-5790.
BibTeX TR2025-146 PDF Video Software Presentation
- @inproceedings{Piedade2025oct,
-   author    = {Piedade, Valter and Chitturi, Sidhartha and Gaspar, Jose and Govindu, Venu and Miraldo, Pedro},
-   title     = {{SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity}},
-   booktitle = {IEEE International Conference on Computer Vision (ICCV)},
-   year      = {2025},
-   pages     = {5780--5790},
-   month     = oct,
-   doi       = {10.1109/ICCV51701.2025.00547},
-   url       = {https://www.merl.com/publications/TR2025-146},
- }
Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
BibTeX TR2025-124 PDF Video Data Presentation
- @inproceedings{Yang2025oct,
-   author    = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
-   title     = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
-   booktitle = {IEEE International Conference on Computer Vision (ICCV)},
-   year      = {2025},
-   month     = oct,
-   url       = {https://www.merl.com/publications/TR2025-124},
- }
Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
BibTeX TR2025-149 PDF Video Presentation
- @inproceedings{Peng2025oct,
-   author    = {Peng, Kuan-Chuan},
-   title     = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
-   booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
-   year      = {2025},
-   month     = oct,
-   url       = {https://www.merl.com/publications/TR2025-149},
- }