Publications

3,591 major publications by members of the MERL staff.


  •  Shirai, Y., Jha, D.K., Raghunathan, A., Romeres, D., "Chance-Constrained Optimization for Contact-rich Systems using Mixed Integer Programming", Nonlinear Analysis: Hybrid Systems, December 2024.
    BibTeX TR2024-008 PDF
    • @article{Shirai2024dec,
    •   author  = {Shirai, Yuki and Jha, Devesh K. and Raghunathan, Arvind and Romeres, Diego},
    •   title   = {Chance-Constrained Optimization for Contact-rich Systems using Mixed Integer Programming},
    •   journal = {Nonlinear Analysis: Hybrid Systems},
    •   year    = {2024},
    •   month   = dec,
    •   url     = {https://www.merl.com/publications/TR2024-008},
    • }
  •  Pan, Z., Wichern, G., Germain, F.G., Subramanian, A., Le Roux, J., "Late Audio-Visual Fusion for In-The-Wild Speaker Diarization", Hands-free Speech Communication and Microphone Arrays (HSCMA), April 2024.
    BibTeX TR2024-029 PDF
    • @inproceedings{Pan2024apr,
    •   author    = {Pan, Zexu and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Subramanian, Aswin and Le Roux, Jonathan},
    •   title     = {Late Audio-Visual Fusion for In-The-Wild Speaker Diarization},
    •   booktitle = {Hands-free Speech Communication and Microphone Arrays (HSCMA)},
    •   year      = {2024},
    •   month     = apr,
    •   url       = {https://www.merl.com/publications/TR2024-029},
    • }
  •  Fujihashi, T., Kato, S., Koike-Akino, T., "Implicit Neural Representation for Low-Overhead Graph-Based Holographic-Type Communications", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2024.
    BibTeX TR2024-022 PDF
    • @inproceedings{Fujihashi2024apr,
    •   author    = {Fujihashi, Takuya and Kato, Sorachi and Koike-Akino, Toshiaki},
    •   title     = {Implicit Neural Representation for Low-Overhead Graph-Based Holographic-Type Communications},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = apr,
    •   url       = {https://www.merl.com/publications/TR2024-022},
    • }
  •  Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), April 2024.
    BibTeX TR2024-032 PDF
    • @inproceedings{Koo2024apr,
    •   author    = {Koo, Junghyun and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Le Roux, Jonathan},
    •   title     = {Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads},
    •   booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
    •   year      = {2024},
    •   month     = apr,
    •   url       = {https://www.merl.com/publications/TR2024-032},
    • }
  •  Vinod, A.P., Weiss, A., Di Cairano, S., "Projection-free computation of robust controllable sets with constrained zonotopes", arXiv, March 2024.
    BibTeX arXiv
    • @article{Vinod2024mar,
    •   author        = {Vinod, Abraham P. and Weiss, Avishai and Di Cairano, Stefano},
    •   title         = {Projection-free computation of robust controllable sets with constrained zonotopes},
    •   journal       = {arXiv},
    •   year          = {2024},
    •   month         = mar,
    •   eprint        = {2403.13730},
    •   archiveprefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2403.13730},
    • }
  •  Gaur, A., Pais, G., Miraldo, P., "Oriented-grid Encoder for 3D Implicit Representations", International Conference on 3D Vision (3DV), March 2024.
    BibTeX TR2024-031 PDF
    • @inproceedings{Gaur2024mar,
    •   author    = {Gaur, Arihant and Pais, Goncalo and Miraldo, Pedro},
    •   title     = {Oriented-grid Encoder for {3D} Implicit Representations},
    •   booktitle = {International Conference on 3D Vision (3DV)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-031},
    • }
  •  Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., Wang, G., Koike-Akino, T., "SuperLoRA: Parameter-Efficient Unified Adaptation of Multi-Layer Attention Modules", arXiv, March 2024.
    BibTeX arXiv
    • @article{Chen2024mar,
    •   author        = {Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew and Wang, Guanghui and Koike-Akino, Toshiaki},
    •   title         = {{SuperLoRA}: Parameter-Efficient Unified Adaptation of Multi-Layer Attention Modules},
    •   journal       = {arXiv},
    •   year          = {2024},
    •   month         = mar,
    •   eprint        = {2403.11887},
    •   archiveprefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2403.11887},
    • }
  •  Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Why does music source separation benefit from cacophony?", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), March 2024.
    BibTeX TR2024-030 PDF
    • @inproceedings{Jeon2024mar,
    •   author    = {Jeon, Chang-Bin and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Le Roux, Jonathan},
    •   title     = {Why does music source separation benefit from cacophony?},
    •   booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-030},
    • }
  •  Bralios, D., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "Generation or Replication: Auscultating Audio Latent Diffusion Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-027 PDF
    • @inproceedings{Bralios2024mar,
    •   author    = {Bralios, Dimitrios and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and Le Roux, Jonathan},
    •   title     = {Generation or Replication: Auscultating Audio Latent Diffusion Models},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-027},
    • }
  •  Fernandez-Menduina, S., Rapp, J., Mansour, H., Greiff, M., Parsons, K., "Tracking Beyond the Unambiguous Range with Modulo Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446835, March 2024, pp. 6-10.
    BibTeX TR2024-021 PDF
    • @inproceedings{Fernandez-Menduina2024mar,
    •   author    = {Fernandez-Menduina, Samuel and Rapp, Joshua and Mansour, Hassan and Greiff, Marcus and Parsons, Kieran},
    •   title     = {Tracking Beyond the Unambiguous Range with Modulo Single-Photon Lidar},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   pages     = {6--10},
    •   year      = {2024},
    •   month     = mar,
    •   doi       = {10.1109/ICASSP48485.2024.10446835},
    •   url       = {https://www.merl.com/publications/TR2024-021},
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "NIIRF: Neural IIR Filter Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-026 PDF
    • @inproceedings{Masuyama2024mar,
    •   author    = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and Le Roux, Jonathan},
    •   title     = {{NIIRF}: Neural {IIR} Filter Field for {HRTF} Upsampling and Personalization},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-026},
    • }
  •  Pan, Z., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "NeuroHeed+: Improving Neuro-steered Speaker Extraction with Joint Auditory Attention Detection", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-025 PDF
    • @inproceedings{Pan2024mar,
    •   author    = {Pan, Zexu and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Le Roux, Jonathan},
    •   title     = {{NeuroHeed+}: Improving Neuro-steered Speaker Extraction with Joint Auditory Attention Detection},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-025},
    • }
  •  Sholokhov, A., Rapp, J., Nabi, S., Brunton, S., Kutz, N., Mansour, H., "Single-pixel imaging of dynamic flows using Neural ODE regularization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-024 PDF
    • @inproceedings{Sholokhov2024mar,
    •   author    = {Sholokhov, Aleksei and Rapp, Joshua and Nabi, Saleh and Brunton, Steven and Kutz, Nathan and Mansour, Hassan},
    •   title     = {Single-pixel imaging of dynamic flows using Neural {ODE} regularization},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-024},
    • }
  •  Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F.G., Le Roux, J., Watanabe, S., "Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-028 PDF
    • @inproceedings{Wu2024mar,
    •   author    = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, Fran{\c{c}}ois G. and Le Roux, Jonathan and Watanabe, Shinji},
    •   title     = {Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and {LLM} Mix-up Augmentation},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-028},
    • }
  •  Kato, S., Wang, P., Koike-Akino, T., Fujihashi, T., Mansour, H., Boufounos, P.T., "Object Trajectory Estimation with Multi-Band Wi-Fi Neural Dynamic Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-019 PDF
    • @inproceedings{Kato2024mar,
    •   author    = {Kato, Sorachi and Wang, Pu and Koike-Akino, Toshiaki and Fujihashi, Takuya and Mansour, Hassan and Boufounos, Petros T.},
    •   title     = {Object Trajectory Estimation with Multi-Band {Wi-Fi} Neural Dynamic Fusion},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-019},
    • }
  •  Wang, P., Boufounos, P.T., "Monostatic DMG Passive Sensing with Hypothesis Testing", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-020 PDF
    • @inproceedings{Wang2024mar,
    •   author    = {Wang, Pu and Boufounos, Petros T.},
    •   title     = {Monostatic {DMG} Passive Sensing with Hypothesis Testing},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-020},
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar Perception with Scalable Connective Temporal Relations for Autonomous Driving", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-023 PDF
    • @inproceedings{Yataka2024mar,
    •   author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    •   title     = {Radar Perception with Scalable Connective Temporal Relations for Autonomous Driving},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-023},
    • }
  •  Kobori, H., Fukuchi, K., Wang, Y., "Evaluation of Information Security Risk from Training Data Inference in Federated Learning", The Institute of Electronics, Information and Communication Engineers, General Conference, March 2024.
    BibTeX
    • @inproceedings{Kobori2024mar,
    •   author    = {Kobori, Hiroko and Fukuchi, Ken and Wang, Ye},
    •   title     = {Evaluation of Information Security Risk from Training Data Inference in Federated Learning},
    •   booktitle = {The Institute of Electronics, Information and Communication Engineers, General Conference},
    •   year      = {2024},
    •   month     = mar,
    • }
  •  Fujihashi, T., Koike-Akino, T., "Graph-Based EEG Signal Compression for Human-Machine Interaction", IEEE Access, DOI: 10.1109/ACCESS.2023.3347592, Vol. 12, pp. 1163-1171, March 2024.
    BibTeX TR2024-015 PDF
    • @article{Fujihashi2024mar,
    •   author  = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
    •   title   = {Graph-Based {EEG} Signal Compression for Human-Machine Interaction},
    •   journal = {IEEE Access},
    •   year    = {2024},
    •   volume  = {12},
    •   pages   = {1163--1171},
    •   month   = mar,
    •   doi     = {10.1109/ACCESS.2023.3347592},
    •   issn    = {2169-3536},
    •   url     = {https://www.merl.com/publications/TR2024-015},
    • }
  •  Baoueb, T., Liu, H., Fontaine, M., Le Roux, J., Richard, G., "SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-013 PDF
    • @inproceedings{Baoueb2024mar,
    •   author    = {Baoueb, Teysir and Liu, Haocheng and Fontaine, Mathieu and Le Roux, Jonathan and Richard, Ga{\"e}l},
    •   title     = {{SpecDiff-GAN}: A Spectrally-Shaped Noise Diffusion {GAN} for Speech and Music Synthesis},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-013},
    • }
  •  Hori, C., Wang, P., Rahman, M., Vaca-Rubio, C., Khurana, S., Cherian, A., Le Roux, J., "Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-012 PDF
    • @inproceedings{Hori2024mar,
    •   author    = {Hori, Chiori and Wang, Pu and Rahman, Mahbub and Vaca-Rubio, Cristian and Khurana, Sameer and Cherian, Anoop and Le Roux, Jonathan},
    •   title     = {{Wi-Fi} based Indoor Monitoring Enhanced by Multimodal Fusion},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-012},
    • }
  •  Liu, H., Baoueb, T., Fontaine, M., Le Roux, J., Richard, G., "GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2024.
    BibTeX TR2024-014 PDF
    • @inproceedings{Liu2024mar,
    •   author    = {Liu, Haocheng and Baoueb, Teysir and Fontaine, Mathieu and Le Roux, Jonathan and Richard, Ga{\"e}l},
    •   title     = {{GLA-Grad}: A {Griffin-Lim} Extended Waveform Generation Diffusion Model},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2024},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2024-014},
    • }
  •  Zhang, X., Mowlavi, S., Benosman, M., Basar, T., "Policy Optimization for PDE Control with a Warm Start", arXiv, March 2024.
    BibTeX arXiv
    • @article{Zhang2024mar,
    •   author        = {Zhang, Xiangyuan and Mowlavi, Saviz and Benosman, Mouhacine and Basar, Tamer},
    •   title         = {Policy Optimization for {PDE} Control with a Warm Start},
    •   journal       = {arXiv},
    •   year          = {2024},
    •   month         = mar,
    •   eprint        = {2403.01005},
    •   archiveprefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2403.01005},
    • }
  •  Hossain, T., Sikder, B., Azad, M.T., Xie, Q., Yuan, M., Yagyu, E., Teo, K.H., Palacios, T., Chowdhury, N., "Fermi-Level Pinning Effect in Gate Region: A Case Study of Multi-Metal Gated AlGaN/GaN HEMT for High RF Linearity", IEEE Electron Devices Technology & Manufacturing Conference, February 2024.
    BibTeX TR2024-010 PDF
    • @inproceedings{Hossain2024feb,
    •   author    = {Hossain, Toiyob and Sikder, Bejoy and Azad, Md. Tasnim and Xie, Qingyun and Yuan, Mengyang and Yagyu, Eiji and Teo, Koon Hoo and Palacios, Tomas and Chowdhury, Nadim},
    •   title     = {Fermi-Level Pinning Effect in Gate Region: A Case Study of Multi-Metal Gated {AlGaN/GaN} {HEMT} for High {RF} Linearity},
    •   booktitle = {IEEE Electron Devices Technology \& Manufacturing Conference},
    •   year      = {2024},
    •   month     = feb,
    •   url       = {https://www.merl.com/publications/TR2024-010},
    • }
  •  Bortoff, S.A., Eisenhower, B., Adetola, V., O'Neil, Z., "Control Challenges and Opportunities in Building Automation" in The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future, February 2024.
    BibTeX TR2024-011 PDF
    • @incollection{Bortoff2024feb,
    •   author    = {Bortoff, Scott A. and Eisenhower, Bryan and Adetola, Veronica and O'Neil, Zheng},
    •   title     = {Control Challenges and Opportunities in Building Automation},
    •   booktitle = {The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future},
    •   year      = {2024},
    •   month     = feb,
    •   url       = {https://www.merl.com/publications/TR2024-011},
    • }