Publications

242 / 3,619 publications found.


  •  Sun, L., Jha, D.K., Hori, C., Jain, S., Corcodel, R., Zhu, X., Tomizuka, M., Romeres, D., "Interactive Planning Using Large Language Models for Partially Observable Robotic Tasks", IEEE International Conference on Robotics and Automation (ICRA), May 2024.
    BibTeX TR2024-052 PDF
    • @inproceedings{Sun2024may,
    • author = {Sun, Lingfeng and Jha, Devesh K. and Hori, Chiori and Jain, Siddarth and Corcodel, Radu and Zhu, Xinghao and Tomizuka, Masayoshi and Romeres, Diego},
    • title = {Interactive Planning Using Large Language Models for Partially Observable Robotic Tasks},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2024,
    • month = may,
    • url = {https://www.merl.com/publications/TR2024-052}
    • }
  •  Dey, R., Egger, B., Boddeti, V., Wang, Y., Marks, T.K., "CoLa-SDF: Controllable Latent StyleSDF for Disentangled 3D Face Generation", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), April 2024.
    BibTeX TR2024-045 PDF
    • @inproceedings{Dey2024apr,
    • author = {Dey, Rahul and Egger, Bernhard and Boddeti, Vishnu and Wang, Ye and Marks, Tim K.},
    • title = {CoLa-SDF: Controllable Latent StyleSDF for Disentangled 3D Face Generation},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
    • year = 2024,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2024-045}
    • }
  •  Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), April 2024.
    BibTeX TR2024-032 PDF
    • @inproceedings{Koo2024apr,
    • author = {Koo, Junghyun and Wichern, Gordon and Germain, François G. and Khurana, Sameer and Le Roux, Jonathan},
    • title = {Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads},
    • booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
    • year = 2024,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2024-032}
    • }
  •  Bralios, D., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "Generation or Replication: Auscultating Audio Latent Diffusion Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-027 PDF
    • @inproceedings{Bralios2024mar,
    • author = {Bralios, Dimitrios and Wichern, Gordon and Germain, François G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and Le Roux, Jonathan},
    • title = {Generation or Replication: Auscultating Audio Latent Diffusion Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2024-027}
    • }
  •  Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F.G., Le Roux, J., Watanabe, S., "Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-028 PDF
    • @inproceedings{Wu2024mar,
    • author = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, François G. and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2024-028}
    • }
  •  Baoueb, T., Liu, H., Fontaine, M., Le Roux, J., Richard, G., "SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446830, March 2024, pp. 986-990.
    BibTeX TR2024-013 PDF
    • @inproceedings{Baoueb2024mar,
    • author = {Baoueb, Teysir and Liu, Haocheng and Fontaine, Mathieu and Le Roux, Jonathan and Richard, Gaël},
    • title = {SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {986--990},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10446830},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-013}
    • }
  •  Hori, C., Wang, P., Rahman, M., Vaca-Rubio, C., Khurana, S., Cherian, A., Le Roux, J., "Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447600, March 2024, pp. 13296-13300.
    BibTeX TR2024-012 PDF
    • @inproceedings{Hori2024mar,
    • author = {Hori, Chiori and Wang, Pu and Rahman, Mahbub and Vaca-Rubio, Cristian and Khurana, Sameer and Cherian, Anoop and Le Roux, Jonathan},
    • title = {Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {13296--13300},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP48485.2024.10447600},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-012}
    • }
  •  Liu, H., Baoueb, T., Fontaine, M., Le Roux, J., Richard, G., "GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446058, March 2024, pp. 11611-11615.
    BibTeX TR2024-014 PDF
    • @inproceedings{Liu2024mar,
    • author = {Liu, Haocheng and Baoueb, Teysir and Fontaine, Mathieu and Le Roux, Jonathan and Richard, Gaël},
    • title = {GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {11611--11615},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10446058},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-014}
    • }
  •  Bortoff, S.A., Eisenhower, B., Adetola, V., O'Neil, Z., "Control Challenges and Opportunities in Building Automation" in The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future, February 2024.
    BibTeX TR2024-011 PDF
    • @incollection{Bortoff2024feb,
    • author = {Bortoff, Scott A. and Eisenhower, Bryan and Adetola, Veronica and O'Neil, Zheng},
    • title = {Control Challenges and Opportunities in Building Automation},
    • booktitle = {The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future},
    • year = 2024,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2024-011}
    • }
  •  Liu, X., Paul, S., Chatterjee, M., Cherian, A., "CAVEN: An Embodied Conversational Agent for Efficient Audio-Visual Navigation in Noisy Environments", AAAI Conference on Artificial Intelligence, DOI: 10.1609/aaai.v38i4.28167, December 2023, pp. 3765-3773.
    BibTeX TR2023-154 PDF
    • @inproceedings{Liu2023dec2,
    • author = {Liu, Xiulong and Paul, Sudipta and Chatterjee, Moitreya and Cherian, Anoop},
    • title = {CAVEN: An Embodied Conversational Agent for Efficient Audio-Visual Navigation in Noisy Environments},
    • booktitle = {Proceedings of the 38th AAAI Conference on Artificial Intelligence},
    • year = 2023,
    • pages = {3765--3773},
    • month = dec,
    • doi = {10.1609/aaai.v38i4.28167},
    • url = {https://www.merl.com/publications/TR2023-154}
    • }
  •  Liu, J., Koike-Akino, T., Wang, P., Brand, M., Wang, Y., Parsons, K., "LoDA: Low-Dimensional Adaptation of Large Language Models", Advances in Neural Information Processing Systems (NeurIPS) workshop, December 2023.
    BibTeX TR2023-150 PDF
    • @inproceedings{Liu2023dec,
    • author = {Liu, Jing and Koike-Akino, Toshiaki and Wang, Pu and Brand, Matthew and Wang, Ye and Parsons, Kieran},
    • title = {LoDA: Low-Dimensional Adaptation of Large Language Models},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) workshop},
    • year = 2023,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2023-150}
    • }
  •  Kong, C., Yerazunis, W.S., Nikovski, D., "Stochastic Learning Manipulation of Object Pose With Under-Actuated Impulse Generator Arrays", International Conference on Machine Learning and Applications (ICMLA), DOI: 10.1109/ICMLA58977.2023.00024, December 2023, pp. 112-119.
    BibTeX TR2023-151 PDF
    • @inproceedings{Kong2023dec,
    • author = {Kong, Chuizheng and Yerazunis, William S. and Nikovski, Daniel},
    • title = {Stochastic Learning Manipulation of Object Pose With Under-Actuated Impulse Generator Arrays},
    • booktitle = {International Conference on Machine Learning and Applications (ICMLA)},
    • year = 2023,
    • pages = {112--119},
    • month = dec,
    • doi = {10.1109/ICMLA58977.2023.00024},
    • url = {https://www.merl.com/publications/TR2023-151}
    • }
  •  Sun, L., Jha, D.K., Hori, C., Jain, S., Corcodel, R., Zhu, X., Tomizuka, M., Romeres, D., "Interactive Planning Using Large Language Models for Partially Observable Robotics Tasks", Advances in Neural Information Processing Systems (NeurIPS) Workshop on Instruction Tuning and Instruction Following, December 2023.
    BibTeX TR2023-148 PDF
    • @inproceedings{Sun2023dec,
    • author = {Sun, Lingfeng and Jha, Devesh K. and Hori, Chiori and Jain, Siddarth and Corcodel, Radu and Zhu, Xinghao and Tomizuka, Masayoshi and Romeres, Diego},
    • title = {Interactive Planning Using Large Language Models for Partially Observable Robotics Tasks},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) Workshop on Instruction Tuning and Instruction Following},
    • year = 2023,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2023-148}
    • }
  •  Zhou, A., Sun, H., Kitamura, S., Nikovski, D., "A Decision-Dependent Chance-Constrained Planning Model for Distribution Networks Under Extreme Weather Events", IEEE PES Innovative Smart Grid Technologies Europe (ISGT-Europe), DOI: 10.1109/ISGTEUROPE56780.2023.10408310, October 2023.
    BibTeX TR2023-133 PDF
    • @inproceedings{Zhou2023oct,
    • author = {Zhou, Anping and Sun, Hongbo and Kitamura, Shoichi and Nikovski, Daniel},
    • title = {A Decision-Dependent Chance-Constrained Planning Model for Distribution Networks Under Extreme Weather Events},
    • booktitle = {IEEE PES Innovative Smart Grid Technologies Europe (ISGT-Europe)},
    • year = 2023,
    • month = oct,
    • doi = {10.1109/ISGTEUROPE56780.2023.10408310},
    • url = {https://www.merl.com/publications/TR2023-133}
    • }
  •  Nair, N.G., Cherian, A., Lohit, S., Wang, Y., Koike-Akino, T., Patel, V.M., Marks, T.K., "Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis", IEEE International Conference on Computer Vision (ICCV), October 2023, pp. 20850-20860.
    BibTeX TR2023-126 PDF Presentation
    • @inproceedings{Nair2023sep,
    • author = {Nair, Nithin Gopalakrishnan and Cherian, Anoop and Lohit, Suhas and Wang, Ye and Koike-Akino, Toshiaki and Patel, Vishal M. and Marks, Tim K.},
    • title = {Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
    • year = 2023,
    • pages = {20850--20860},
    • month = oct,
    • publisher = {IEEE/CVF},
    • url = {https://www.merl.com/publications/TR2023-126}
    • }
  •  Wang, B., Zhang, S., Inoue, H., Kanemaru, M., "Semi-Supervised Machine Learning for Motor Eccentricity Fault Diagnosis", Asia Pacific Conference of the Prognostics and Health Management Society, DOI: 10.36001/phmap.2023.v4i1.3644, September 2023.
    BibTeX TR2023-117 PDF
    • @inproceedings{Wang2023sep,
    • author = {Wang, Bingnan and Zhang, Shen and Inoue, Hiroshi and Kanemaru, Makoto},
    • title = {Semi-Supervised Machine Learning for Motor Eccentricity Fault Diagnosis},
    • booktitle = {Asia Pacific Conference of the Prognostics and Health Management Society},
    • year = 2023,
    • month = sep,
    • publisher = {PHM Society},
    • doi = {10.36001/phmap.2023.v4i1.3644},
    • url = {https://www.merl.com/publications/TR2023-117}
    • }
  •  Zhan, S., Chakrabarty, A., Laughman, C.R., Chong, A., "A Virtual Testbed for Robust and Reproducible Calibration of Building Energy Simulation Models", 18th IBPSA International Conference and Exhibition Building Simulation, DOI: 10.26868/25222708.2023.1482, September 2023.
    BibTeX TR2023-114 PDF
    • @inproceedings{Zhan2023sep,
    • author = {Zhan, Sicheng and Chakrabarty, Ankush and Laughman, Christopher R. and Chong, Adrian},
    • title = {A Virtual Testbed for Robust and Reproducible Calibration of Building Energy Simulation Models},
    • booktitle = {18th IBPSA International Conference and Exhibition Building Simulation},
    • year = 2023,
    • month = sep,
    • doi = {10.26868/25222708.2023.1482},
    • url = {https://www.merl.com/publications/TR2023-114}
    • }
  •  Hori, C., Peng, P., Harwath, D., Liu, X., Ota, K., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Style-transfer based Speech and Audio-visual Scene understanding for Robot Action Sequence Acquisition from Videos", Interspeech, DOI: 10.21437/Interspeech.2023-1983, August 2023, pp. 4663-4667.
    BibTeX TR2023-104 PDF
    • @inproceedings{Hori2023aug,
    • author = {Hori, Chiori and Peng, Puyuang and Harwath, David and Liu, Xinyu and Ota, Kei and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and Le Roux, Jonathan},
    • title = {Style-transfer based Speech and Audio-visual Scene understanding for Robot Action Sequence Acquisition from Videos},
    • booktitle = {Interspeech},
    • year = 2023,
    • pages = {4663--4667},
    • month = aug,
    • doi = {10.21437/Interspeech.2023-1983},
    • url = {https://www.merl.com/publications/TR2023-104}
    • }
  •  Chakrabarty, A., Vinod, A.P., Mansour, H., Bortoff, S.A., Laughman, C.R., "Moving Horizon Estimation for Digital Twins using Deep Autoencoders", World Congress of the International Federation of Automatic Control (IFAC), Ishii, H. and Ebihara, Y. and Imura, J. and Yamakita, M., Eds., DOI: 10.1016/j.ifacol.2023.10.207, July 2023, pp. 5500-5505.
    BibTeX TR2023-088 PDF
    • @inproceedings{Chakrabarty2023jul2,
    • author = {Chakrabarty, Ankush and Vinod, Abraham P. and Mansour, Hassan and Bortoff, Scott A. and Laughman, Christopher R.},
    • title = {Moving Horizon Estimation for Digital Twins using Deep Autoencoders},
    • booktitle = {World Congress of the International Federation of Automatic Control (IFAC)},
    • year = 2023,
    • editor = {Ishii, H. and Ebihara, Y. and Imura, J. and Yamakita, M.},
    • pages = {5500--5505},
    • month = jul,
    • publisher = {Elsevier},
    • doi = {10.1016/j.ifacol.2023.10.207},
    • url = {https://www.merl.com/publications/TR2023-088}
    • }
  •  Di Cairano, S., Skibik, T., Vinod, A.P., Weiss, A., Berntorp, K., "Decision Making for Automated Driving by Reachability of Parameterized Maneuvers", World Congress of the International Federation of Automatic Control (IFAC), Ishii, H. and Ebihara, Y. and Imura, J. and Yamakita, M., Eds., DOI: 10.1016/j.ifacol.2023.10.018, July 2023, pp. 7852-7857.
    BibTeX TR2023-084 PDF
    • @inproceedings{DiCairano2023jul,
    • author = {Di Cairano, Stefano and Skibik, Terrence and Vinod, Abraham P. and Weiss, Avishai and Berntorp, Karl},
    • title = {Decision Making for Automated Driving by Reachability of Parameterized Maneuvers},
    • booktitle = {World Congress of the International Federation of Automatic Control (IFAC)},
    • year = 2023,
    • editor = {Ishii, H. and Ebihara, Y. and Imura, J. and Yamakita, M.},
    • pages = {7852--7857},
    • month = jul,
    • publisher = {Elsevier},
    • doi = {10.1016/j.ifacol.2023.10.018},
    • url = {https://www.merl.com/publications/TR2023-084}
    • }
  •  Salatiello, A., Wang, Y., Wichern, G., Koike-Akino, T., Yoshihiro, O., Kaneko, Y., Laughman, C.R., Chakrabarty, A., "Synthesizing Building Operation Data with Generative Models: VAEs, GANs, or Something In Between?", ACM e-Energy Conference, DOI: 10.1145/3599733.3600260, June 2023.
    BibTeX TR2023-072 PDF
    • @inproceedings{Salatiello2023jun,
    • author = {Salatiello, Alessandro and Wang, Ye and Wichern, Gordon and Koike-Akino, Toshiaki and Yoshihiro, Ohta and Kaneko, Yosuke and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {Synthesizing Building Operation Data with Generative Models: VAEs, GANs, or Something In Between?},
    • booktitle = {ACM e-Energy Conference},
    • year = 2023,
    • month = jun,
    • doi = {10.1145/3599733.3600260},
    • url = {https://www.merl.com/publications/TR2023-072}
    • }
  •  Hu, H., Menner, M., Wang, Y., Fang, H., Sun, D., Takegami, T., "Simulator-based Mission Optimization for Conceptual Aircraft Design with Turboelectric Propulsion", AIAA/IEEE Electric Aircraft Technologies Symposium (EATS), DOI: 10.2514/6.2023-3872, June 2023, pp. 3872.
    BibTeX TR2023-069 PDF
    • @inproceedings{Hu2023jun,
    • author = {Hu, Hanyao and Menner, Marcel and Wang, Yebin and Fang, Huazhen and Sun, Dengfeng and Takegami, Tomoki},
    • title = {Simulator-based Mission Optimization for Conceptual Aircraft Design with Turboelectric Propulsion},
    • booktitle = {AIAA/IEEE Electric Aircraft Technologies Symposium (EATS)},
    • year = 2023,
    • pages = 3872,
    • month = jun,
    • doi = {10.2514/6.2023-3872},
    • url = {https://www.merl.com/publications/TR2023-069}
    • }
  •  Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F., Le Roux, J., Watanabe, S., "BEATs-based Audio Captioning Model with Instructor Embedding Supervision and ChatGPT Mix-up", Tech. Rep. TR2023-068, DCASE2023 Challenge, May 2023.
    BibTeX TR2023-068 PDF
    • @techreport{Wu2023may,
    • author = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, Francois and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {BEATs-based Audio Captioning Model with Instructor Embedding Supervision and ChatGPT Mix-up},
    • institution = {DCASE2023 Challenge},
    • year = 2023,
    • month = may,
    • url = {https://www.merl.com/publications/TR2023-068}
    • }
  •  Ota, K., Tung, H.-Y., Smith, K., Cherian, A., Marks, T.K., Sullivan, A., Kanezaki, A., Tenenbaum, J.B., "H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160575, May 2023, pp. 7272-7278.
    BibTeX TR2023-009 PDF
    • @inproceedings{Ota2023may,
    • author = {Ota, Kei and Tung, Hsiao-Yu and Smith, Kevin and Cherian, Anoop and Marks, Tim K. and Sullivan, Alan and Kanezaki, Asako and Tenenbaum, Joshua B.},
    • title = {H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2023,
    • pages = {7272--7278},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA48891.2023.10160575},
    • url = {https://www.merl.com/publications/TR2023-009}
    • }
  •  Shirai, Y., Jha, D.K., Raghunathan, A., Hong, D., "Tactile Tool Manipulation", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160480, May 2023, pp. 12597-12603.
    BibTeX TR2023-023 PDF Video
    • @inproceedings{Shirai2023may2,
    • author = {Shirai, Yuki and Jha, Devesh K. and Raghunathan, Arvind and Hong, Dennis},
    • title = {Tactile Tool Manipulation},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2023,
    • pages = {12597--12603},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA48891.2023.10160480},
    • isbn = {979-8-3503-2365-8},
    • url = {https://www.merl.com/publications/TR2023-023}
    • }