Publications

128 / 3,874 publications found.


  •  Sawada, N., Miraldo, P., Lohit, S., Marks, T.K., Chatterjee, M., "FreBIS: Frequency-Based Stratification for Neural Implicit Surface Representations", IEEE Conference on Computer Vision and Pattern Recognition Workshop (CVPR), June 2025.
    BibTeX TR2025-074 PDF
    • @inproceedings{Sawada2025jun,
    • author = {Sawada, Naoko and Miraldo, Pedro and Lohit, Suhas and Marks, Tim K. and Chatterjee, Moitreya},
    • title = {{FreBIS: Frequency-Based Stratification for Neural Implicit Surface Representations}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshop (CVPR)},
    • year = 2025,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2025-074}
    • }
  •  Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", arXiv, April 2025.
    BibTeX arXiv
    • @article{Hu2025apr,
    • author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
    • title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • url = {https://arxiv.org/abs/2504.03607}
    • }
  •  Das, A., Rahman, S., Xiang, X., Palash, R.H., Hossain, T., Sikder, B., Yagyu, E., Nakamura, M., Teo, K.H., Chowdhury, N., "Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate", Advanced Theory and Simulations, DOI: 10.1002/adts.202401207, March 2025.
    BibTeX TR2025-040 PDF
    • @article{Das2025mar,
    • author = {Das, Aurick and Rahman, Saimur and Xiang, Xiaofeng and Palash, Rafid Hassan and Hossain, Toiyob and Sikder, Bejoy and Yagyu, Eiji and Nakamura, Marika and Teo, Koon Hoo and Chowdhury, Nadim},
    • title = {{Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate}},
    • journal = {Advanced Theory and Simulations},
    • year = 2025,
    • month = mar,
    • doi = {10.1002/adts.202401207},
    • url = {https://www.merl.com/publications/TR2025-040}
    • }
  •  Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar,
    • author = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
    • title = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • url = {https://arxiv.org/abs/2503.17269}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Marks, T.K., Lohit, S., Mansour, H., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar2,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Marks, Tim K. and Lohit, Suhas and Mansour, Hassan},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • url = {https://arxiv.org/abs/2503.17351}
    • }
  •  Lohit, S., Marks, T.K., "Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images", Asilomar Conference on Signals, Systems, and Computers (ACSSC), DOI: 10.1109/IEEECONF60004.2024.10942613, January 2025, pp. 1360-1365.
    BibTeX TR2025-009 PDF
    • @inproceedings{Lohit2025jan,
    • author = {Lohit, Suhas and Marks, Tim K.},
    • title = {{Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images}},
    • booktitle = {2024 58th Asilomar Conference on Signals, Systems, and Computers (ACSSC)},
    • year = 2025,
    • pages = {1360--1365},
    • month = jan,
    • publisher = {IEEE},
    • doi = {10.1109/IEEECONF60004.2024.10942613},
    • issn = {2576-2303},
    • isbn = {979-8-3503-5405-8},
    • url = {https://www.merl.com/publications/TR2025-009}
    • }
  •  Berntorp, K., Greiff, M., "A Framework for Joint Vehicle Localization and Road Mapping Using Onboard Sensors", Control Engineering Practice, November 2024.
    BibTeX TR2024-163 PDF
    • @article{Berntorp2024nov,
    • author = {Berntorp, Karl and Greiff, Marcus},
    • title = {{A Framework for Joint Vehicle Localization and Road Mapping Using Onboard Sensors}},
    • journal = {Control Engineering Practice},
    • year = 2024,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2024-163}
    • }
  •  Kosanic, M., Sun, H., Kawano, S., Raghunathan, A., Kitamura, S., "Sequentially Pruning Phase Rebalance Schedule: Load Profile Learning Approach", IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe), DOI: 10.1109/ISGTEUROPE62998.2024.10861894, October 2024.
    BibTeX TR2024-143 PDF
    • @inproceedings{Kosanic2024oct,
    • author = {Kosanic, Miroslav and Sun, Hongbo and Kawano, Shunsuke and Raghunathan, Arvind and Kitamura, Shoichi},
    • title = {{Sequentially Pruning Phase Rebalance Schedule: Load Profile Learning Approach}},
    • booktitle = {IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe)},
    • year = 2024,
    • month = oct,
    • doi = {10.1109/ISGTEUROPE62998.2024.10861894},
    • url = {https://www.merl.com/publications/TR2024-143}
    • }
  •  Cherian, A., Jain, S., Marks, T.K., "Few-shot Transparent Instance Segmentation for Bin Picking", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), September 2024, pp. 5009-5016.
    BibTeX TR2024-127 PDF Video
    • @inproceedings{Cherian2024sep,
    • author = {Cherian, Anoop and Jain, Siddarth and Marks, Tim K.},
    • title = {{Few-shot Transparent Instance Segmentation for Bin Picking}},
    • booktitle = {2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2024,
    • pages = {5009--5016},
    • month = sep,
    • publisher = {IEEE},
    • url = {https://www.merl.com/publications/TR2024-127}
    • }
  •  Yin, J., Luo, A., Du, Y., Cherian, A., Marks, T.K., Le Roux, J., Gan, C., "Disentangled Acoustic Fields For Multimodal Physical Scene Understanding", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), September 2024, pp. 557-564.
    BibTeX TR2024-125 PDF
    • @inproceedings{Yin2024sep,
    • author = {Yin, Jie and Luo, Andrew and Du, Yilun and Cherian, Anoop and Marks, Tim K. and {Le Roux}, Jonathan and Gan, Chuang},
    • title = {{Disentangled Acoustic Fields For Multimodal Physical Scene Understanding}},
    • booktitle = {2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2024,
    • pages = {557--564},
    • month = sep,
    • publisher = {IEEE},
    • url = {https://www.merl.com/publications/TR2024-125}
    • }
  •  Berntorp, K., Greiff, M., "Variational Bayes Kalman Filter for Joint Vehicle Localization and Road Mapping Using Onboard Sensors", European Control Conference (ECC), DOI: 10.23919/ECC64448.2024.10590965, June 2024, pp. 725-730.
    BibTeX TR2024-082 PDF
    • @inproceedings{Berntorp2024jun,
    • author = {Berntorp, Karl and Greiff, Marcus},
    • title = {{Variational Bayes Kalman Filter for Joint Vehicle Localization and Road Mapping Using Onboard Sensors}},
    • booktitle = {European Control Conference (ECC)},
    • year = 2024,
    • pages = {725--730},
    • month = jun,
    • doi = {10.23919/ECC64448.2024.10590965},
    • url = {https://www.merl.com/publications/TR2024-082}
    • }
  •  Ni, H., Egger, B., Lohit, S., Cherian, A., Wang, Y., Koike-Akino, T., Huang, S.X., Marks, T.K., "TI2V-Zero: Zero-Shot Image Conditioning for Text-to-Video Diffusion Models", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2024, pp. 9015-9025.
    BibTeX TR2024-059 PDF Video Software Presentation
    • @inproceedings{Ni2024jun,
    • author = {Ni, Haomiao and Egger, Bernhard and Lohit, Suhas and Cherian, Anoop and Wang, Ye and Koike-Akino, Toshiaki and Huang, Sharon X. and Marks, Tim K.},
    • title = {{TI2V-Zero: Zero-Shot Image Conditioning for Text-to-Video Diffusion Models}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2024,
    • pages = {9015--9025},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2024-059}
    • }
  •  Dey, R., Egger, B., Boddeti, V., Wang, Y., Marks, T.K., "CoLa-SDF: Controllable Latent StyleSDF for Disentangled 3D Face Generation", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), April 2024.
    BibTeX TR2024-045 PDF
    • @inproceedings{Dey2024apr,
    • author = {Dey, Rahul and Egger, Bernhard and Boddeti, Vishnu and Wang, Ye and Marks, Tim K.},
    • title = {{CoLa-SDF: Controllable Latent StyleSDF for Disentangled 3D Face Generation}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
    • year = 2024,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2024-045}
    • }
  •  Yang, Z., Liu, J., Chen, P., Cherian, A., Marks, T.K., Le Roux, J., Gan, C., "RILA: Reflective and Imaginative Language Agent for Zero-Shot Semantic Audio-Visual Navigation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), April 2024, pp. 16251-16261.
    BibTeX TR2024-043 PDF
    • @inproceedings{Yang2024apr,
    • author = {Yang, Zeyuan and Liu, Jiageng and Chen, Peihao and Cherian, Anoop and Marks, Tim K. and {Le Roux}, Jonathan and Gan, Chuang},
    • title = {{RILA: Reflective and Imaginative Language Agent for Zero-Shot Semantic Audio-Visual Navigation}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2024,
    • pages = {16251--16261},
    • month = apr,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2024-043}
    • }
  •  Nair, N.G., Cherian, A., Lohit, S., Wang, Y., Koike-Akino, T., Patel, V.M., Marks, T.K., "Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis", IEEE International Conference on Computer Vision (ICCV), October 2023, pp. 20850-20860.
    BibTeX TR2023-126 PDF Software Presentation
    • @inproceedings{Nair2023sep,
    • author = {Nair, Nithin Gopalakrishnan and Cherian, Anoop and Lohit, Suhas and Wang, Ye and Koike-Akino, Toshiaki and Patel, Vishal M. and Marks, Tim K.},
    • title = {{Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis}},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
    • year = 2023,
    • pages = {20850--20860},
    • month = oct,
    • publisher = {IEEE/CVF},
    • url = {https://www.merl.com/publications/TR2023-126}
    • }
  •  Shenoy, V., Marks, T.K., Mansour, H., Lohit, S., "Unrolled IPPG: Video Heart Rate Estimation via Unrolling Proximal Gradient Descent", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/ICIP49359.2023.10222169, September 2023, pp. 2715-2719.
    BibTeX TR2023-116 PDF Video
    • @inproceedings{Shenoy2023sep,
    • author = {Shenoy, Vineet and Marks, Tim K. and Mansour, Hassan and Lohit, Suhas},
    • title = {{Unrolled IPPG: Video Heart Rate Estimation via Unrolling Proximal Gradient Descent}},
    • booktitle = {IEEE International Conference on Image Processing (ICIP)},
    • year = 2023,
    • pages = {2715--2719},
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/ICIP49359.2023.10222169},
    • isbn = {978-1-7281-9835-4},
    • url = {https://www.merl.com/publications/TR2023-116}
    • }
  •  Berntorp, K., Greiff, M., Di Cairano, S., Miraldo, P., "Bayesian Sensor Fusion for Joint Vehicle Localization and Road Mapping Using Onboard Sensors", International Conference on Information Fusion (FUSION), DOI: 10.23919/FUSION52260.2023.10224204, June 2023, pp. 1-8.
    BibTeX TR2023-074 PDF
    • @inproceedings{Berntorp2023jun,
    • author = {Berntorp, Karl and Greiff, Marcus and {Di Cairano}, Stefano and Miraldo, Pedro},
    • title = {{Bayesian Sensor Fusion for Joint Vehicle Localization and Road Mapping Using Onboard Sensors}},
    • booktitle = {International Conference on Information Fusion (FUSION)},
    • year = 2023,
    • pages = {1--8},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.23919/FUSION52260.2023.10224204},
    • isbn = {979-8-89034-485-4},
    • url = {https://www.merl.com/publications/TR2023-074}
    • }
  •  Cherian, A., Jain, S., Marks, T.K., Sullivan, A., "Discriminative 3D Shape Modeling for Few-Shot Instance Segmentation", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160644, May 2023, pp. 9296-9302.
    BibTeX TR2023-010 PDF Presentation
    • @inproceedings{Cherian2023may,
    • author = {Cherian, Anoop and Jain, Siddarth and Marks, Tim K. and Sullivan, Alan},
    • title = {{Discriminative 3D Shape Modeling for Few-Shot Instance Segmentation}},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2023,
    • pages = {9296--9302},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA48891.2023.10160644},
    • url = {https://www.merl.com/publications/TR2023-010}
    • }
  •  Ota, K., Tung, H.-Y., Smith, K., Cherian, A., Marks, T.K., Sullivan, A., Kanezaki, A., Tenenbaum, J.B., "H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160575, May 2023, pp. 7272-7278.
    BibTeX TR2023-009 PDF
    • @inproceedings{Ota2023may,
    • author = {Ota, Kei and Tung, Hsiao-Yu and Smith, Kevin and Cherian, Anoop and Marks, Tim K. and Sullivan, Alan and Kanezaki, Asako and Tenenbaum, Joshua B.},
    • title = {{H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions}},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2023,
    • pages = {7272--7278},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA48891.2023.10160575},
    • url = {https://www.merl.com/publications/TR2023-009}
    • }
  •  Shah, A.P., Geng, S., Gao, P., Cherian, A., Hori, T., Marks, T.K., Le Roux, J., Hori, C., "Audio-Visual Scene-Aware Dialog and Reasoning Using Audio-Visual Transformers with Joint Student-Teacher Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2022, pp. 7732-7736.
    BibTeX TR2022-019 PDF
    • @inproceedings{Shah2022apr,
    • author = {Shah, Ankit Parag and Geng, Shijie and Gao, Peng and Cherian, Anoop and Hori, Takaaki and Marks, Tim K. and {Le Roux}, Jonathan and Hori, Chiori},
    • title = {{Audio-Visual Scene-Aware Dialog and Reasoning Using Audio-Visual Transformers with Joint Student-Teacher Learning}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {7732--7736},
    • month = apr,
    • publisher = {IEEE},
    • issn = {1520-6149},
    • isbn = {978-1-6654-0540-9},
    • url = {https://www.merl.com/publications/TR2022-019}
    • }
  •  Hori, C., Shah, A.P., Geng, S., Gao, P., Cherian, A., Hori, T., Le Roux, J., Marks, T.K., "Overview of Audio Visual Scene-Aware Dialog with Reasoning Track for Natural Language Generation in DSTC10", The 10th Dialog System Technology Challenge Workshop at AAAI, February 2022.
    BibTeX TR2022-016 PDF
    • @inproceedings{Hori2022feb,
    • author = {Hori, Chiori and Shah, Ankit Parag and Geng, Shijie and Gao, Peng and Cherian, Anoop and Hori, Takaaki and {Le Roux}, Jonathan and Marks, Tim K.},
    • title = {{Overview of Audio Visual Scene-Aware Dialog with Reasoning Track for Natural Language Generation in DSTC10}},
    • booktitle = {The 10th Dialog System Technology Challenge Workshop at AAAI},
    • year = 2022,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2022-016}
    • }
  •  Cherian, A., Hori, C., Marks, T.K., Le Roux, J., "(2.5+1)D Spatio-Temporal Scene Graphs for Video Question Answering", AAAI Conference on Artificial Intelligence, DOI: 10.1609/aaai.v36i1.19922, February 2022, pp. 444-453.
    BibTeX TR2022-014 PDF Video Presentation
    • @inproceedings{Cherian2022feb,
    • author = {Cherian, Anoop and Hori, Chiori and Marks, Tim K. and {Le Roux}, Jonathan},
    • title = {{(2.5+1)D Spatio-Temporal Scene Graphs for Video Question Answering}},
    • booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {444--453},
    • month = feb,
    • doi = {10.1609/aaai.v36i1.19922},
    • url = {https://www.merl.com/publications/TR2022-014}
    • }
  •  Medin, S.C., Egger, B., Cherian, A., Wang, Y., Tenenbaum, J.B., Liu, X., Marks, T.K., "MOST-GAN: 3D Morphable StyleGAN for Disentangled Face Image Manipulation", AAAI Conference on Artificial Intelligence, DOI: 10.1609/aaai.v36i2.20091, February 2022, pp. 1962-1971.
    BibTeX TR2022-011 PDF Video Data Presentation
    • @inproceedings{Medin2022feb,
    • author = {Medin, Safa C. and Egger, Bernhard and Cherian, Anoop and Wang, Ye and Tenenbaum, Joshua B. and Liu, Xiaoming and Marks, Tim K.},
    • title = {{MOST-GAN: 3D Morphable StyleGAN for Disentangled Face Image Manipulation}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {1962--1971},
    • month = feb,
    • doi = {10.1609/aaai.v36i2.20091},
    • url = {https://www.merl.com/publications/TR2022-011}
    • }
  •  Cherian, A., Pais, G., Jain, S., Marks, T.K., Sullivan, A., "InSeGAN: A Generative Approach to Segmenting Identical Instances in Depth Images", IEEE International Conference on Computer Vision (ICCV), October 2021, pp. 10023-10032.
    BibTeX TR2021-097 PDF Video Data Software Presentation
    • @inproceedings{Cherian2021oct,
    • author = {Cherian, Anoop and Pais, Goncalo and Jain, Siddarth and Marks, Tim K. and Sullivan, Alan},
    • title = {{InSeGAN: A Generative Approach to Segmenting Identical Instances in Depth Images}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2021,
    • pages = {10023--10032},
    • month = oct,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2021-097}
    • }
  •  Comas, A., Marks, T.K., Mansour, H., Lohit, S., Ma, Y., Liu, X., "TURNIP: Time-series U-NET with Recurrence for NIR Imaging PPG", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/ICIP42928.2021.9506663, September 2021, pp. 309-313.
    BibTeX TR2021-099 PDF
    • @inproceedings{Comas2021sep,
    • author = {Comas, Armand and Marks, Tim K. and Mansour, Hassan and Lohit, Suhas and Ma, Yechi and Liu, Xiaoming},
    • title = {{TURNIP: Time-series U-NET with Recurrence for NIR Imaging PPG}},
    • booktitle = {IEEE International Conference on Image Processing (ICIP)},
    • year = 2021,
    • pages = {309--313},
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/ICIP42928.2021.9506663},
    • url = {https://www.merl.com/publications/TR2021-099}
    • }