Publications

674 / 3,854 publications found.


  •  Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
    BibTeX TR2025-039 PDF Presentation
    • @inproceedings{Ranade2025mar,
    • author = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
    • title = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
    • booktitle = {International Conference on 3D Vision (3DV)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-039}
    • }
  •  Tian, J., Shi, J., Chen, W., Arora, S., Masuyama, Y., Takashi, M., Wu, Y., Peng, J., Bharadwaj, S., Zhao, Y., Cornell, S., Peng, Y., Yue, X., Yang, C.-H.H., Neubig, G., Watanabe, S., "ESPnet-SpeechLM: An Open Speech Language Model Toolkit", NAACL-HLT (the system demonstration track), Dziri, N. and Ren, S. X. and Diao, S., Eds., March 2025, pp. 116-124.
    BibTeX TR2025-038 PDF
    • @inproceedings{Tian2025mar,
    • author = {Tian, Jinchuan and Shi, Jiatong and Chen, William and Arora, Siddhant and Masuyama, Yoshiki and Takashi, Maekaku and Wu, Yihan and Peng, Junyi and Bharadwaj, Shikhar and Zhao, Yiwen and Cornell, Samuele and Peng, Yifan and Yue, Xiang and Yang, Chao-Han H. and Neubig, Graham and Watanabe, Shinji},
    • title = {{ESPnet-SpeechLM: An Open Speech Language Model Toolkit}},
    • booktitle = {NAACL-HLT (the system demonstration track)},
    • year = 2025,
    • editor = {Dziri, N. and Ren, S. X. and Diao, S.},
    • pages = {116--124},
    • month = mar,
    • publisher = {Association for Computational Linguistics},
    • url = {https://www.merl.com/publications/TR2025-038}
    • }
  •  Wang, R., Wang, Y., Liu, J., Koike-Akino, T., "Quantum Diffusion Models for Few-Shot Learning", AAAI Conference on Artificial Intelligence, March 2025.
    BibTeX TR2025-025 PDF
    • @inproceedings{Wang2025mar,
    • author = {Wang, Ruhan and Wang, Ye and Liu, Jing and Koike-Akino, Toshiaki},
    • title = {{Quantum Diffusion Models for Few-Shot Learning}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-025}
    • }
  •  Fujihashi, T., Koike-Akino, T., "Quantum Implicit Neural Compression", AAAI Conference on Artificial Intelligence, March 2025.
    BibTeX TR2025-024 PDF
    • @inproceedings{Fujihashi2025mar,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
    • title = {{Quantum Implicit Neural Compression}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-024}
    • }
  •  Wang, Y., Peng, K.-C., Fu, R., "Towards Zero-shot 3D Anomaly Localization", IEEE Winter Conference on Applications of Computer Vision (WACV), Biswas, S. and Averbuch-Elor, H. and Štruc, V. and Yang, Y., Eds., DOI: 10.1109/WACV61041.2025.00148, February 2025, pp. 1447-1456.
    BibTeX TR2025-020 PDF Video Presentation
    • @inproceedings{Wang2025feb2,
    • author = {Wang, Yizhou and Peng, Kuan-Chuan and Fu, Raymond},
    • title = {{Towards Zero-shot 3D Anomaly Localization}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2025,
    • editor = {Biswas, S. and Averbuch-Elor, H. and Štruc, V. and Yang, Y.},
    • pages = {1447--1456},
    • month = feb,
    • publisher = {IEEE},
    • doi = {10.1109/WACV61041.2025.00148},
    • issn = {2642-9381},
    • isbn = {979-8-3315-1083-1},
    • url = {https://www.merl.com/publications/TR2025-020}
    • }
  •  Rashid, M.R.U., Liu, J., Koike-Akino, T., Wang, Y., Mehnaz, S., "Forget to Flourish: Leveraging Machine-Unlearning on Pretrained Language Models for Privacy Leakage", AAAI Conference on Artificial Intelligence, Toby Walsh, Julie Shah, Zico Kolter, Eds., DOI: 10.1609/aaai.v39i19.34218, February 2025, pp. 20139-20147.
    BibTeX TR2025-017 PDF
    • @inproceedings{Rashid2025feb,
    • author = {Rashid, Md Rafi Ur and Liu, Jing and Koike-Akino, Toshiaki and Wang, Ye and Mehnaz, Shagufta},
    • title = {{Forget to Flourish: Leveraging Machine-Unlearning on Pretrained Language Models for Privacy Leakage}},
    • booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence},
    • year = 2025,
    • editor = {Walsh, Toby and Shah, Julie and Kolter, Zico},
    • pages = {20139--20147},
    • month = feb,
    • publisher = {Association for the Advancement of Artificial Intelligence (AAAI)},
    • doi = {10.1609/aaai.v39i19.34218},
    • issn = {2374-3468},
    • isbn = {978-1-57735-897-8},
    • url = {https://www.merl.com/publications/TR2025-017}
    • }
  •  Mumcu, F., Jones, M.J., Yilmaz, Y., Cherian, A., "ComplexVAD: Detecting Interaction Anomalies in Video", IEEE Winter Conference on Applications of Computer Vision (WACV) Workshop, February 2025.
    BibTeX TR2025-016 PDF Data
    • @inproceedings{Mumcu2025feb,
    • author = {Mumcu, Furkan and Jones, Michael J. and Yilmaz, Yasin and Cherian, Anoop},
    • title = {{ComplexVAD: Detecting Interaction Anomalies in Video}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV) Workshop},
    • year = 2025,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2025-016}
    • }
  •  Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3534686, Vol. 6, pp. 266-275, January 2025.
    BibTeX TR2025-012 PDF Software
    • @article{Koo2025jan,
    • author = {Koo, Junghyun and Wichern, Gordon and Germain, François G. and Khurana, Sameer and {Le Roux}, Jonathan},
    • title = {{SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2025,
    • volume = 6,
    • pages = {266--275},
    • month = jan,
    • doi = {10.1109/OJSP.2025.3534686},
    • issn = {2644-1322},
    • url = {https://www.merl.com/publications/TR2025-012}
    • }
  •  Lohit, S., Marks, T.K., "Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images", Asilomar Conference on Signals, Systems, and Computers (ACSSC), DOI: 10.1109/IEEECONF60004.2024.10942613, January 2025, pp. 1360-1365.
    BibTeX TR2025-009 PDF
    • @inproceedings{Lohit2025jan,
    • author = {Lohit, Suhas and Marks, Tim K.},
    • title = {{Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images}},
    • booktitle = {2024 58th Asilomar Conference on Signals, Systems, and Computers (ACSSC)},
    • year = 2025,
    • pages = {1360--1365},
    • month = jan,
    • publisher = {IEEE},
    • doi = {10.1109/IEEECONF60004.2024.10942613},
    • issn = {2576-2303},
    • isbn = {979-8-3503-5405-8},
    • url = {https://www.merl.com/publications/TR2025-009}
    • }
  •  He, Y., Shin, S., Cherian, A., Trigoni, N., Markham, A., "SoundLoc3D: Invisible 3D Sound Source Localization and Classification Using a Multimodal RGB-D Acoustic Camera", IEEE Winter Conference on Applications of Computer Vision (WACV), December 2024, pp. 5408-5418.
    BibTeX TR2025-003 PDF
    • @inproceedings{He2024dec2,
    • author = {He, Yuhang and Shin, Sangyun and Cherian, Anoop and Trigoni, Niki and Markham, Andrew},
    • title = {{SoundLoc3D: Invisible 3D Sound Source Localization and Classification Using a Multimodal RGB-D Acoustic Camera}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2024,
    • pages = {5408--5418},
    • month = dec,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2025-003}
    • }
  •  Zhang, J., Zhang, F., Rodriguez, C., Ben-Shabat, I., Cherian, A., Gould, S., "Temporally Grounding Instructional Diagrams in Unconstrained Videos", IEEE Winter Conference on Applications of Computer Vision (WACV), December 2024, pp. 8090-8100.
    BibTeX TR2025-002 PDF
    • @inproceedings{Zhang2024dec,
    • author = {Zhang, Jiahao and Zhang, Frederic and Rodriguez, Cristian and Ben-Shabat, Itzik and Cherian, Anoop and Gould, Stephen},
    • title = {{Temporally Grounding Instructional Diagrams in Unconstrained Videos}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2024,
    • pages = {8090--8100},
    • month = dec,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2025-002}
    • }
  •  Bimbraw, K., Wang, Y., Liu, J., Koike-Akino, T., "GPT Sonograpy: Hand Gesture Decoding from Forearm Ultrasound Images via VLM", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-175 PDF Presentation
    • @inproceedings{Bimbraw2024dec,
    • author = {Bimbraw, Keshav and Wang, Ye and Liu, Jing and Koike-Akino, Toshiaki},
    • title = {{GPT Sonograpy: Hand Gesture Decoding from Forearm Ultrasound Images via VLM}},
    • booktitle = {Advancements In Medical Foundation Models: Explainability, Robustness, Security, and Beyond Workshop at Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-175}
    • }
  •  Chen, X., Wang, Y., Brand, M., Wang, P., Liu, J., Koike-Akino, T., "Slaying the HyDRA: Parameter-Efficient Hyper Networks with Low-Displacement Rank Adaptation", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-157 PDF Presentation
    • @inproceedings{Chen2024dec,
    • author = {Chen, Xiangyu and Wang, Ye and Brand, Matthew and Wang, Pu and Liu, Jing and Koike-Akino, Toshiaki},
    • title = {{Slaying the HyDRA: Parameter-Efficient Hyper Networks with Low-Displacement Rank Adaptation}},
    • booktitle = {Workshop on Adaptive Foundation Models: Evolving AI for Personalized and Efficient Learning at Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-157}
    • }
  •  Fujihashi, T., Kato, S., Koike-Akino, T., "FV-NeRV: Neural Compression for Free Viewpoint Videos", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-176 PDF
    • @inproceedings{Fujihashi2024dec,
    • author = {Fujihashi, Takuya and Kato, Sorachi and Koike-Akino, Toshiaki},
    • title = {{FV-NeRV: Neural Compression for Free Viewpoint Videos}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-176}
    • }
  •  Park, Y.-J., Germain, F.G., Liu, J., Wang, Y., Koike-Akino, T., Wichern, G., Laughman, C.R., Azizan, N., Chakrabarty, A., "Probabilistic Forecasting for Building Energy Systems: Are Time-Series Foundation Models The Answer?", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2025-001 PDF
    • @inproceedings{Park2024dec,
    • author = {Park, Young-Jin and Germain, François G. and Liu, Jing and Wang, Ye and Koike-Akino, Toshiaki and Wichern, Gordon and Laughman, Christopher R. and Azizan, Navid and Chakrabarty, Ankush},
    • title = {{Probabilistic Forecasting for Building Energy Systems: Are Time-Series Foundation Models The Answer?}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-001}
    • }
  •  Tang, W.-T., Chakrabarty, A., Paulson, J.A., "TR-BEACON: Shedding Light on Efficient Behavior Discovery in High-Dimensional Spaces with Bayesian Novelty Search over Trust Regions", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-167 PDF
    • @inproceedings{Tang2024dec,
    • author = {Tang, Wei-Ting and Chakrabarty, Ankush and Paulson, Joel A.},
    • title = {{TR-BEACON: Shedding Light on Efficient Behavior Discovery in High-Dimensional Spaces with Bayesian Novelty Search over Trust Regions}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-167}
    • }
  •  Liu, J., Wang, Y., Koike-Akino, T., Nakai, T., Oonishi, K., Higashi, T., "MEL-PETs Defense for the NeurIPS 2024 LLM Privacy Challenge Blue Team Track", LLM Privacy Challenge at Neural Information Processing Systems (NeurIPS) 2024, December 2024.
    BibTeX TR2024-166 PDF Video Presentation
    • @inproceedings{Liu2024dec,
    • author = {Liu, Jing and Wang, Ye and Koike-Akino, Toshiaki and Nakai, Tsunato and Oonishi, Kento and Higashi, Takuya},
    • title = {{MEL-PETs Defense for the NeurIPS 2024 LLM Privacy Challenge Blue Team Track}},
    • booktitle = {LLM Privacy Challenge at Neural Information Processing Systems (NeurIPS) 2024},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-166}
    • }
  •  Wang, Y., Nakai, T., Liu, J., Koike-Akino, T., Oonishi, K., Higashi, T., "MEL-PETs Joint-Context Attack for the NeurIPS 2024 LLM Privacy Challenge Red Team Track", LLM Privacy Challenge at Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-165 PDF Video Presentation
    • @inproceedings{Wang2024dec2,
    • author = {Wang, Ye and Nakai, Tsunato and Liu, Jing and Koike-Akino, Toshiaki and Oonishi, Kento and Higashi, Takuya},
    • title = {{MEL-PETs Joint-Context Attack for the NeurIPS 2024 LLM Privacy Challenge Red Team Track}},
    • booktitle = {LLM Privacy Challenge at Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-165}
    • }
  •  Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Spatially-Aware Losses for Enhanced Neural Acoustic Fields", NeurIPS 2024 Audio Imagination Workshop, December 2024.
    BibTeX TR2024-169 PDF
    • @inproceedings{Ick2024dec,
    • author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and {Le Roux}, Jonathan},
    • title = {{Spatially-Aware Losses for Enhanced Neural Acoustic Fields}},
    • booktitle = {NeurIPS 2024 Audio Imagination Workshop},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-169}
    • }
  •  Rashid, M.R.U., Liu, J., Koike-Akino, T., Mehnaz, S., Wang, Y., "Forget to Flourish: Leveraging Machine-Unlearning on Pretrained Language Models for Privacy Leakage", Red Teaming GenAI Workshop at Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-168 PDF
    • @inproceedings{Rashid2024dec,
    • author = {Rashid, Md Rafi Ur and Liu, Jing and Koike-Akino, Toshiaki and Mehnaz, Shagufta and Wang, Ye},
    • title = {{Forget to Flourish: Leveraging Machine-Unlearning on Pretrained Language Models for Privacy Leakage}},
    • booktitle = {Red Teaming GenAI Workshop at Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • publisher = {OpenReview},
    • url = {https://www.merl.com/publications/TR2024-168}
    • }
  •  Ryo, H., Rashid, M.R.U., Lewis, A., Liu, J., Koike-Akino, T., Parsons, K., Wang, Y., "Smoothed Embeddings for Robust Language Models", Safe Generative AI Workshop at Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-170 PDF Presentation
    • @inproceedings{Ryo2024dec,
    • author = {Ryo, Hase and Rashid, Md Rafi Ur and Lewis, Ashley and Liu, Jing and Koike-Akino, Toshiaki and Parsons, Kieran and Wang, Ye},
    • title = {{Smoothed Embeddings for Robust Language Models}},
    • booktitle = {Safe Generative AI Workshop at Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • publisher = {OpenReview},
    • url = {https://www.merl.com/publications/TR2024-170}
    • }
  •  Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., Wang, G., Koike-Akino, T., "SuperLoRA: Parameter-Efficient Unified Adaptation of Large Foundation Models", British Machine Vision Conference (BMVC), November 2024.
    BibTeX TR2024-156 PDF Presentation
    • @inproceedings{Chen2024nov,
    • author = {Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew and Wang, Guanghui and Koike-Akino, Toshiaki},
    • title = {{SuperLoRA: Parameter-Efficient Unified Adaptation of Large Foundation Models}},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2024,
    • month = nov,
    • publisher = {British Machine Vision Association},
    • url = {https://www.merl.com/publications/TR2024-156}
    • }
  •  Cherian, A., Peng, K.-C., Lohit, S., Matthiesen, J., Smith, K., Tenenbaum, J.B., "Evaluating Large Vision-and-Language Models on Children’s Mathematical Olympiads", Advances in Neural Information Processing Systems (NeurIPS), November 2024, pp. 15779-15800.
    BibTeX TR2024-160 PDF Video Presentation
    • @inproceedings{Cherian2024nov,
    • author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Matthiesen, Joanna and Smith, Kevin and Tenenbaum, Joshua B.},
    • title = {{Evaluating Large Vision-and-Language Models on Children’s Mathematical Olympiads}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • pages = {15779--15800},
    • month = nov,
    • publisher = {NeurIPS Proceedings},
    • url = {https://www.merl.com/publications/TR2024-160}
    • }
  •  Cornell, S., Ebbers, J., Douwes, C., Martin-Morato, I., Harju, M., Mesaros, A., Serizel, R., "DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels", Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop, October 2024, pp. 31-35.
    BibTeX TR2024-146 PDF
    • @inproceedings{Cornell2024oct,
    • author = {Cornell, Samuele and Ebbers, Janek and Douwes, Constance and Martin-Morato, Irene and Harju, Manu and Mesaros, Annamaria and Serizel, Romain},
    • title = {{DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels}},
    • booktitle = {Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop},
    • year = 2024,
    • pages = {31--35},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2024-146}
    • }
  •  Li, Z., Lowy, A., Liu, J., Koike-Akino, T., Parsons, K., Malin, B., Wang, Y., "Analyzing Inference Privacy Risks Through Gradients In Machine Learning", ACM Conference on Computer and Communications Security (CCS), DOI: 10.1145/3658644.3690304, October 2024, pp. 3466-3480.
    BibTeX TR2024-141 PDF
    • @inproceedings{Li2024oct,
    • author = {Li, Zhuohang and Lowy, Andrew and Liu, Jing and Koike-Akino, Toshiaki and Parsons, Kieran and Malin, Bradley and Wang, Ye},
    • title = {{Analyzing Inference Privacy Risks Through Gradients In Machine Learning}},
    • booktitle = {Proceedings of the 2024 on ACM SIGSAC Conference on Computer and Communications Security},
    • year = 2024,
    • pages = {3466--3480},
    • month = oct,
    • publisher = {Association for Computing Machinery},
    • doi = {10.1145/3658644.3690304},
    • isbn = {9798400706363},
    • url = {https://www.merl.com/publications/TR2024-141}
    • }