Publications

3,622 major publications by members of the MERL staff.


  •  Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F.G., Le Roux, J., Watanabe, S., "Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-028 PDF
    • @inproceedings{Wu2024mar,
    • author = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, François G. and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2024-028}
    • }
  •  Kato, S., Wang, P., Koike-Akino, T., Fujihashi, T., Mansour, H., Boufounos, P.T., "Object Trajectory Estimation with Multi-Band Wi-Fi Neural Dynamic Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP48485.2024.10445972, March 2024, pp. 13261-13265.
    BibTeX TR2024-019 PDF
    • @inproceedings{Kato2024mar,
    • author = {Kato, Sorachi and Wang, Pu and Koike-Akino, Toshiaki and Fujihashi, Takuya and Mansour, Hassan and Boufounos, Petros T.},
    • title = {Object Trajectory Estimation with Multi-Band Wi-Fi Neural Dynamic Fusion},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {13261--13265},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP48485.2024.10445972},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-019}
    • }
  •  Wang, P., Boufounos, P.T., "Monostatic DMG Passive Sensing with Hypothesis Testing", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP48485.2024.10447134, March 2024, pp. 13381-13385.
    BibTeX TR2024-020 PDF
    • @inproceedings{Wang2024mar,
    • author = {Wang, Pu and Boufounos, Petros T.},
    • title = {Monostatic DMG Passive Sensing with Hypothesis Testing},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {13381--13385},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP48485.2024.10447134},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-020}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar Perception with Scalable Connective Temporal Relations for Autonomous Driving", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP48485.2024.10446449, March 2024, pp. 13266-13270.
    BibTeX TR2024-023 PDF
    • @inproceedings{Yataka2024mar,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {Radar Perception with Scalable Connective Temporal Relations for Autonomous Driving},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {13266--13270},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP48485.2024.10446449},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-023}
    • }
  •  Kobori, H., Fukuchi, K., Wang, Y., "Evaluation of Information Security Risk from Training Data Inference in Federated Learning", The Institute of Electronics, Information and Communication Engineers, General Conference, March 2024.
    BibTeX
    • @inproceedings{Kobori2024mar,
    • author = {Kobori, Hiroko and Fukuchi, Ken and Wang, Ye},
    • title = {Evaluation of Information Security Risk from Training Data Inference in Federated Learning},
    • booktitle = {The Institute of Electronics, Information and Communication Engineers, General Conference},
    • year = 2024,
    • month = mar
    • }
  •  Fujihashi, T., Koike-Akino, T., "Graph-Based EEG Signal Compression for Human-Machine Interaction", IEEE Access, DOI: 10.1109/​ACCESS.2023.3347592, Vol. 12, pp. 1163-1171, March 2024.
    BibTeX TR2024-015 PDF
    • @article{Fujihashi2024mar,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
    • title = {Graph-Based EEG Signal Compression for Human-Machine Interaction},
    • journal = {IEEE Access},
    • year = 2024,
    • volume = 12,
    • publisher = {IEEE},
    • pages = {1163--1171},
    • month = mar,
    • doi = {10.1109/ACCESS.2023.3347592},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2024-015}
    • }
  •  Baoueb, T., Liu, H., Fontaine, M., Le Roux, J., Richard, G., "SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP48485.2024.10446830, March 2024, pp. 986-990.
    BibTeX TR2024-013 PDF
    • @inproceedings{Baoueb2024mar,
    • author = {Baoueb, Teysir and Liu, Haocheng and Fontaine, Mathieu and Le Roux, Jonathan and Richard, Gaël},
    • title = {SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {986--990},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10446830},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-013}
    • }
  •  Hori, C., Wang, P., Rahman, M., Vaca-Rubio, C., Khurana, S., Cherian, A., Le Roux, J., "Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP48485.2024.10447600, March 2024, pp. 13296-13300.
    BibTeX TR2024-012 PDF
    • @inproceedings{Hori2024mar,
    • author = {Hori, Chiori and Wang, Pu and Rahman, Mahbub and Vaca-Rubio, Cristian and Khurana, Sameer and Cherian, Anoop and Le Roux, Jonathan},
    • title = {Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {13296--13300},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP48485.2024.10447600},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-012}
    • }
  •  Liu, H., Baoueb, T., Fontaine, M., Le Roux, J., Richard, G., "GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP48485.2024.10446058, March 2024, pp. 11611-11615.
    BibTeX TR2024-014 PDF
    • @inproceedings{Liu2024mar,
    • author = {Liu, Haocheng and Baoueb, Teysir and Fontaine, Mathieu and Le Roux, Jonathan and Richard, Gaël},
    • title = {GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {11611--11615},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10446058},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-014}
    • }
  •  Zhang, X., Mowlavi, S., Benosman, M., Basar, T., "Policy Optimization for PDE Control with a Warm Start", arXiv, March 2024.
    BibTeX arXiv
    • @article{Zhang2024mar,
    • author = {Zhang, Xiangyuan and Mowlavi, Saviz and Benosman, Mouhacine and Basar, Tamer},
    • title = {Policy Optimization for PDE Control with a Warm Start},
    • journal = {arXiv},
    • year = 2024,
    • month = mar,
    • url = {https://arxiv.org/abs/2403.01005}
    • }
  •  Hossain, T., Sikder, B., Azad, M.T., Xie, Q., Yuan, M., Yagyu, E., Teo, K.H., Palacios, T., Chowdhury, N., "Fermi-Level Pinning Effect in Gate Region: A Case Study of Multi-Metal Gated AlGaN/GaN HEMT for High RF Linearity", IEEE Electron Devices Technology & Manufacturing Conference, February 2024.
    BibTeX TR2024-010 PDF
    • @inproceedings{Hossain2024feb,
    • author = {Hossain, Toiyob and Sikder, Bejoy and Azad, Md. Tasnim and Xie, Qingyun and Yuan, Mengyang and Yagyu, Eiji and Teo, Koon Hoo and Palacios, Tomas and Chowdhury, Nadim},
    • title = {Fermi-Level Pinning Effect in Gate Region: A Case Study of Multi-Metal Gated AlGaN/GaN HEMT for High RF Linearity},
    • booktitle = {IEEE Electron Devices Technology \& Manufacturing Conference},
    • year = 2024,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2024-010}
    • }
  •  Bortoff, S.A., Eisenhower, B., Adetola, V., O'Neill, Z., "Control Challenges and Opportunities in Building Automation" in The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future, February 2024.
    BibTeX TR2024-011 PDF
    • @incollection{Bortoff2024feb,
    • author = {Bortoff, Scott A. and Eisenhower, Bryan and Adetola, Veronica and O'Neill, Zheng},
    • title = {Control Challenges and Opportunities in Building Automation},
    • booktitle = {The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future},
    • year = 2024,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2024-011}
    • }
  •  Ozcan, E.C., Giammarino, V., Queeney, J., Paschalidis, I.C., "A Model-Based Approach for Improving Reinforcement Learning Efficiency Leveraging Expert Observations", arXiv, February 2024.
    BibTeX arXiv
    • @article{Ozcan2024feb,
    • author = {Ozcan, Erhan Can and Giammarino, Vittorio and Queeney, James and Paschalidis, Ioannis Ch.},
    • title = {A Model-Based Approach for Improving Reinforcement Learning Efficiency Leveraging Expert Observations},
    • journal = {arXiv},
    • year = 2024,
    • month = feb,
    • url = {https://arxiv.org/abs/2402.18836}
    • }
  •  Lowy, A., Li, Z., Liu, J., Koike-Akino, T., Parsons, K., Wang, Y., "Why Does Differential Privacy with Large ε Defend Against Practical Membership Inference Attacks?", AAAI Workshop on Privacy-Preserving Artificial Intelligence, February 2024.
    BibTeX TR2024-009 PDF
    • @inproceedings{Lowy2024feb2,
    • author = {Lowy, Andrew and Li, Zhuohang and Liu, Jing and Koike-Akino, Toshiaki and Parsons, Kieran and Wang, Ye},
    • title = {Why Does Differential Privacy with Large ε Defend Against Practical Membership Inference Attacks?},
    • booktitle = {AAAI Workshop on Privacy-Preserving Artificial Intelligence},
    • year = 2024,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2024-009}
    • }
  •  Basu, S., Lohit, S., Brand, M., "G-RepsNet: A Fast and General Construction of Equivariant Networks for Arbitrary Matrix Groups", arXiv, February 2024.
    BibTeX arXiv
    • @article{Basu2024feb,
    • author = {Basu, Sourya and Lohit, Suhas and Brand, Matthew},
    • title = {G-RepsNet: A Fast and General Construction of Equivariant Networks for Arbitrary Matrix Groups},
    • journal = {arXiv},
    • year = 2024,
    • month = feb,
    • url = {https://arxiv.org/abs/2402.15413}
    • }
  •  Xie, X., Mowlavi, S., Benosman, M., "Smooth and Sparse Latent Dynamics in Operator Learning with Jerk Regularization", arXiv, February 2024.
    BibTeX arXiv
    • @article{Xie2024feb,
    • author = {Xie, Xiaoyu and Mowlavi, Saviz and Benosman, Mouhacine},
    • title = {Smooth and Sparse Latent Dynamics in Operator Learning with Jerk Regularization},
    • journal = {arXiv},
    • year = 2024,
    • month = feb,
    • url = {https://arxiv.org/abs/2402.15636}
    • }
  •  Kuwabara, A., Osako, Y., Kato, S., Fujihashi, T., Koike-Akino, T., Watanabe, T., "Implicit Neural Representation-based Hybrid Digital-Analog Image Delivery", IEEE International Conference on Computing, Networking and Communications (ICNC), February 2024.
    BibTeX TR2024-007 PDF
    • @inproceedings{Kuwabara2024feb,
    • author = {Kuwabara, Akihiro and Osako, Yutaro and Kato, Sorachi and Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi},
    • title = {Implicit Neural Representation-based Hybrid Digital-Analog Image Delivery},
    • booktitle = {IEEE International Conference on Computing, Networking and Communications (ICNC)},
    • year = 2024,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2024-007}
    • }
  •  Boeddeker, C., Subramanian, A.S., Wichern, G., Haeb-Umbach, R., Le Roux, J., "TS-SEP: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2024.3350887, Vol. 32, pp. 1185-1197, February 2024.
    BibTeX TR2024-006 PDF
    • @article{Boeddeker2024feb,
    • author = {Boeddeker, Christoph and Subramanian, Aswin Shanmugam and Wichern, Gordon and Haeb-Umbach, Reinhold and Le Roux, Jonathan},
    • title = {TS-SEP: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2024,
    • volume = 32,
    • pages = {1185--1197},
    • month = feb,
    • doi = {10.1109/TASLP.2024.3350887},
    • issn = {2329-9304},
    • url = {https://www.merl.com/publications/TR2024-006}
    • }
  •  Ma, Y., Rapp, J., Boufounos, P.T., Mansour, H., "A model of spatial resolution uncertainty for Compton camera imaging", International Conference on Advancements in Nuclear Instrumentation Measurement Methods and their Applications (ANIMMA), DOI: 10.1051/​epjconf/​202328810002, January 2024, pp. 10002.
    BibTeX TR2024-005 PDF
    • @inproceedings{Ma2024jan,
    • author = {Ma, Yanting and Rapp, Joshua and Boufounos, Petros T. and Mansour, Hassan},
    • title = {A model of spatial resolution uncertainty for Compton camera imaging},
    • booktitle = {International Conference on Advancements in Nuclear Instrumentation Measurement Methods and their Applications (ANIMMA)},
    • year = 2024,
    • pages = 10002,
    • month = jan,
    • series = {EPJ Web of Conferences},
    • volume = 288,
    • doi = {10.1051/epjconf/202328810002},
    • url = {https://www.merl.com/publications/TR2024-005}
    • }
  •  Srinivas, N., Vinod, A.P., Di Cairano, S., Weiss, A., "Lunar Landing with Feasible Divert using Controllable Sets", AIAA SciTech, DOI: 10.2514/​6.2024-0324, January 2024, pp. AIAA 2024-0324.
    BibTeX TR2024-004 PDF
    • @inproceedings{Srinivas2024jan,
    • author = {Srinivas, Neeraj and Vinod, Abraham P. and Di Cairano, Stefano and Weiss, Avishai},
    • title = {Lunar Landing with Feasible Divert using Controllable Sets},
    • booktitle = {AIAA SCITECH 2024 Forum},
    • year = 2024,
    • pages = {AIAA 2024-0324},
    • month = jan,
    • doi = {10.2514/6.2024-0324},
    • url = {https://www.merl.com/publications/TR2024-004}
    • }
  •  Kitichotkul, R., Rapp, J., Goyal, V.K., "The Role of Detection Times in Reflectivity Estimation with Single-Photon Lidar", IEEE Journal of Selected Topics in Quantum Electronics, DOI: 10.1109/​JSTQE.2023.3333834, Vol. 30, No. 1, pp. 8800114:1-14, January 2024.
    BibTeX TR2024-003 PDF
    • @article{Kitichotkul2024jan,
    • author = {Kitichotkul, Ruangrawee and Rapp, Joshua and Goyal, Vivek K.},
    • title = {The Role of Detection Times in Reflectivity Estimation with Single-Photon Lidar},
    • journal = {IEEE Journal of Selected Topics in Quantum Electronics},
    • year = 2024,
    • volume = 30,
    • number = 1,
    • pages = {8800114:1--14},
    • month = jan,
    • doi = {10.1109/JSTQE.2023.3333834},
    • url = {https://www.merl.com/publications/TR2024-003}
    • }
  •  Zhao, G., Jha, D.K., Wang, Y., Zhu, M., "iPolicy: Incremental Policy Algorithms for Feedback Motion Planning", arXiv, January 2024.
    BibTeX arXiv
    • @article{Zhao2024jan,
    • author = {Zhao, Guoxiang and Jha, Devesh K. and Wang, Yebin and Zhu, Minghui},
    • title = {iPolicy: Incremental Policy Algorithms for Feedback Motion Planning},
    • journal = {arXiv},
    • year = 2024,
    • month = jan,
    • url = {https://arxiv.org/abs/2401.02883}
    • }
  •  Carmichael, Z., Lohit, S., Cherian, A., Jones, M.J., Scheirer, W., "Pixel-Grounded Prototypical Part Networks", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2024.
    BibTeX TR2024-002 PDF Presentation
    • @inproceedings{Carmichael2024jan,
    • author = {Carmichael, Zachariah and Lohit, Suhas and Cherian, Anoop and Jones, Michael J. and Scheirer, Walter},
    • title = {Pixel-Grounded Prototypical Part Networks},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2024,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2024-002}
    • }
  •  Qiao, H., Kobayashi, T., Laughman, C.R., Bortoff, S.A., "On the Characteristics of One-Dimensional Compressible Flow", International Modelica Conference, Dirk Müller, Antonello Monti, and Andrea Benigni, Eds., DOI: 10.3384/​ecp204327, December 2023, pp. 327-336.
    BibTeX TR2024-001 PDF
    • @inproceedings{Qiao2023dec,
    • author = {Qiao, Hongtao and Kobayashi, Takashi and Laughman, Christopher R. and Bortoff, Scott A.},
    • title = {On the Characteristics of One-Dimensional Compressible Flow},
    • booktitle = {Proceedings of the 15th International Modelica Conference 2023},
    • year = 2023,
    • editor = {Müller, Dirk and Monti, Antonello and Benigni, Andrea},
    • pages = {327--336},
    • month = dec,
    • doi = {10.3384/ecp204327},
    • isbn = {978-91-8075-505-4},
    • url = {https://www.merl.com/publications/TR2024-001}
    • }
  •  Liu, X., Paul, S., Chatterjee, M., Cherian, A., "CAVEN: An Embodied Conversational Agent for Efficient Audio-Visual Navigation in Noisy Environments", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v38i4.28167, December 2023, pp. 3765-3773.
    BibTeX TR2023-154 PDF
    • @inproceedings{Liu2023dec2,
    • author = {Liu, Xiulong and Paul, Sudipta and Chatterjee, Moitreya and Cherian, Anoop},
    • title = {CAVEN: An Embodied Conversational Agent for Efficient Audio-Visual Navigation in Noisy Environments},
    • booktitle = {Proceedings of the 38th AAAI Conference on Artificial Intelligence},
    • year = 2023,
    • pages = {3765--3773},
    • month = dec,
    • doi = {10.1609/aaai.v38i4.28167},
    • url = {https://www.merl.com/publications/TR2023-154}
    • }