Publications

590 / 3,591 publications found.


  •  Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
    BibTeX TR2023-014 PDF Data Software Presentation
    • @inproceedings{Cherian2023mar,
    • author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
    • title = {Are Deep Neural Networks {SMARTer} than Second Graders?},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2023,
    • pages = {10834--10844},
    • month = mar,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2023-014}
    • }
  •  Mateus, A., Ranade, S., Ramalingam, S., Miraldo, P., "Fast and Accurate 3D Registration from Line Intersection Constraints", International Journal of Computer Vision, DOI: 10.1007/​s11263-023-01774-1, Vol. 131, pp. 2044-2069, February 2023.
    BibTeX TR2023-007 PDF
    • @article{Mateus2023feb,
    • author = {Mateus, Andre and Ranade, Siddhant and Ramalingam, Srikumar and Miraldo, Pedro},
    • title = {Fast and Accurate {3D} Registration from Line Intersection Constraints},
    • journal = {International Journal of Computer Vision},
    • year = 2023,
    • volume = 131,
    • pages = {2044--2069},
    • month = feb,
    • doi = {10.1007/s11263-023-01774-1},
    • url = {https://www.merl.com/publications/TR2023-007}
    • }
  •  Aich, A., Peng, K.-C., Roy-Chowdhury, A.K., "Cross-Domain Video Anomaly Detection without Target Domain Adaptation", IEEE Winter Conference on Applications of Computer Vision (WACV), Crandall, D. and Gong, B. and Lee, Y. J. and Souvenir, R. and Yu, S., Eds., DOI: 10.1109/​WACV56688.2023.00261, January 2023, pp. 2578-2590.
    BibTeX TR2023-001 PDF Video Presentation
    • @inproceedings{Aich2023jan,
    •   author    = {Aich, Abhishek and Peng, Kuan-Chuan and Roy-Chowdhury, Amit K.},
    •   title     = {Cross-Domain Video Anomaly Detection without Target Domain Adaptation},
    •   booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    •   editor    = {Crandall, D. and Gong, B. and Lee, Y. J. and Souvenir, R. and Yu, S.},
    •   publisher = {IEEE},
    •   year      = {2023},
    •   month     = jan,
    •   pages     = {2578--2590},
    •   doi       = {10.1109/WACV56688.2023.00261},
    •   isbn      = {978-1-6654-9346-8},
    •   issn      = {2642-9381},
    •   url       = {https://www.merl.com/publications/TR2023-001},
    • }
  •  Shimoya, R., Morimoto, T., van Baar, J., Boufounos, P.T., Ma, Y., Mansour, H., "Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images", IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), DOI: 10.1109/​AVSS56176.2022.9959354, November 2022, pp. 1-8.
    BibTeX TR2022-149 PDF
    • @inproceedings{Shimoya2022nov,
    • author = {Shimoya, Ryosuke and Morimoto, Takashi and van Baar, Jeroen and Boufounos, Petros T. and Ma, Yanting and Mansour, Hassan},
    • title = {Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images},
    • booktitle = {IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS)},
    • year = 2022,
    • pages = {1--8},
    • month = nov,
    • doi = {10.1109/AVSS56176.2022.9959354},
    • isbn = {978-1-6654-6382-9},
    • url = {https://www.merl.com/publications/TR2022-149}
    • }
  •  Romero, D., Lohit, S., "Learning Partial Equivariances from Data", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 36466-36478.
    BibTeX TR2022-148 PDF Presentation
    • @inproceedings{Romero2022nov,
    •   author    = {Romero, David and Lohit, Suhas},
    •   title     = {Learning Partial Equivariances from Data},
    •   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    •   editor    = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
    •   year      = {2022},
    •   month     = nov,
    •   pages     = {36466--36478},
    •   url       = {https://www.merl.com/publications/TR2022-148},
    • }
  •  Wang, H., Lohit, S., Jones, M.J., Fu, R., "What Makes a “Good” Data Augmentation in Knowledge Distillation – A Statistical Perspective", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 13456-13469.
    BibTeX TR2022-147 PDF
    • @inproceedings{Wang2022nov,
    • author = {Wang, Huan and Lohit, Suhas and Jones, Michael J. and Fu, Raymond},
    • title = {What Makes a {``Good''} Data Augmentation in Knowledge Distillation -- A Statistical Perspective},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2022,
    • editor = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
    • pages = {13456--13469},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2022-147}
    • }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation", Advances in Neural Information Processing Systems (NeurIPS), November 2022.
    BibTeX TR2022-140 PDF Presentation
    • @inproceedings{Chatterjee2022nov,
    •   author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
    •   title     = {Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation},
    •   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    •   year      = {2022},
    •   month     = nov,
    •   url       = {https://www.merl.com/publications/TR2022-140},
    • }
  •  Ahmed, S.M., Lohit, S., Peng, K.-C., Jones, M.J., Roy-Chowdhury, A.K., "Cross-Modal Knowledge Transfer Without Task-Relevant Source Data", European Conference on Computer Vision (ECCV), Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G.M. and Hassner, T., Eds., DOI: 10.1007/​978-3-031-19830-4_7, October 2022, pp. 111-127.
    BibTeX TR2022-135 PDF Video Software Presentation
    • @inproceedings{Ahmed2022oct,
    • author = {Ahmed, Sk Miraj and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Roy-Chowdhury, Amit K.},
    • title = {Cross-Modal Knowledge Transfer Without Task-Relevant Source Data},
    • booktitle = {Computer Vision--ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23--27, 2022, Proceedings, Part XXXIV},
    • year = 2022,
    • editor = {Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G. M. and Hassner, T.},
    • pages = {111--127},
    • month = oct,
    • publisher = {Springer},
    • doi = {10.1007/978-3-031-19830-4_7},
    • isbn = {978-3-031-19830-4},
    • url = {https://www.merl.com/publications/TR2022-135}
    • }
  •  Paul, S., Roy-Chowdhury, A.K., Cherian, A., "AVLEN: Audio-Visual-Language Embodied Navigation in 3D Environments", Advances in Neural Information Processing Systems (NeurIPS), October 2022, pp. 6236-6249.
    BibTeX TR2022-131 PDF Video Data Software
    • @inproceedings{Paul2022oct2,
    • author = {Paul, Sudipta and Roy-Chowdhury, Amit K. and Cherian, Anoop},
    • title = {{AVLEN}: Audio-Visual-Language Embodied Navigation in {3D} Environments},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2022,
    • pages = {6236--6249},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2022-131}
    • }
  •  Mansour, H., Lohit, S., Boufounos, P.T., "Distributed Radar Autofocus Imaging Using Deep Priors", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/​ICIP46576.2022.9897332, October 2022, pp. 2511-2515.
    BibTeX TR2022-129 PDF Video
    • @inproceedings{Mansour2022oct,
    •   author    = {Mansour, Hassan and Lohit, Suhas and Boufounos, Petros T.},
    •   title     = {Distributed Radar Autofocus Imaging Using Deep Priors},
    •   booktitle = {IEEE International Conference on Image Processing (ICIP)},
    •   year      = {2022},
    •   month     = oct,
    •   pages     = {2511--2515},
    •   doi       = {10.1109/ICIP46576.2022.9897332},
    •   url       = {https://www.merl.com/publications/TR2022-129},
    • }
  •  Hori, C., Hori, T., Le Roux, J., "Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers", Interspeech, DOI: 10.21437/​Interspeech.2022-10891, September 2022, pp. 4511-4515.
    BibTeX TR2022-116 PDF
    • @inproceedings{Hori2022sep,
    •   author    = {Hori, Chiori and Hori, Takaaki and Le Roux, Jonathan},
    •   title     = {Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers},
    •   booktitle = {Interspeech},
    •   year      = {2022},
    •   month     = sep,
    •   pages     = {4511--4515},
    •   doi       = {10.21437/Interspeech.2022-10891},
    •   url       = {https://www.merl.com/publications/TR2022-116},
    • }
  •  Rambhatla, S., Jones, M.J., Chellappa, R., "An Empirical Analysis of Boosting Deep Networks", International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/​IJCNN55064.2022.9892204, July 2022.
    BibTeX TR2022-075 PDF Presentation
    • @inproceedings{Rambhatla2022jul,
    •   author    = {Rambhatla, Sai and Jones, Michael J. and Chellappa, Rama},
    •   title     = {An Empirical Analysis of Boosting Deep Networks},
    •   booktitle = {International Joint Conference on Neural Networks (IJCNN)},
    •   year      = {2022},
    •   month     = jul,
    •   doi       = {10.1109/IJCNN55064.2022.9892204},
    •   url       = {https://www.merl.com/publications/TR2022-075},
    • }
  •  Miraldo, P., Iglesias, J.P., "A Unified Model for Line Projections in Catadioptric Cameras with Rotationally Symmetric Mirrors", IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR52688.2022.01534, June 2022.
    BibTeX TR2022-084 PDF
    • @inproceedings{Miraldo2022jun,
    •   author    = {Miraldo, Pedro and Iglesias, Jose Pedro},
    •   title     = {A Unified Model for Line Projections in Catadioptric Cameras with Rotationally Symmetric Mirrors},
    •   booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    •   year      = {2022},
    •   month     = jun,
    •   doi       = {10.1109/CVPR52688.2022.01534},
    •   url       = {https://www.merl.com/publications/TR2022-084},
    • }
  •  Sullivan, A., Wang, J., Li, X., Chen, S., Abbot, L., "PointMotionNet: Point-Wise Motion Learning for Large-Scale LiDAR Point Clouds Sequences", CVPR Workshop on Autonomous Driving, June 2022.
    BibTeX TR2022-083 PDF
    • @inproceedings{Sullivan2022jun,
    • author = {Sullivan, Alan and Wang, Jun and Li, Xiaolong and Chen, Siheng and Abbot, Lynn},
    • title = {{PointMotionNet}: Point-Wise Motion Learning for Large-Scale {LiDAR} Point Clouds Sequences},
    • booktitle = {CVPR Workshop on Autonomous Driving},
    • year = 2022,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2022-083}
    • }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Quantifying Predictive Uncertainty for Stochastic Video Synthesis from Audio", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), June 2022.
    BibTeX TR2022-082 PDF
    • @inproceedings{Chatterjee2022jun,
    •   author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
    •   title     = {Quantifying Predictive Uncertainty for Stochastic Video Synthesis from Audio},
    •   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
    •   year      = {2022},
    •   month     = jun,
    •   url       = {https://www.merl.com/publications/TR2022-082},
    • }
  •  Zhu, X., Jain, S., Tomizuka, M., van Baar, J., "Learning to Synthesize Volumetric Meshes from Vision-based Tactile Imprints", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/​ICRA46639.2022.9812092, May 2022, pp. 4833-4839.
    BibTeX TR2022-055 PDF
    • @inproceedings{Zhu2022may2,
    •   author    = {Zhu, Xinghao and Jain, Siddarth and Tomizuka, Masayoshi and van Baar, Jeroen},
    •   title     = {Learning to Synthesize Volumetric Meshes from Vision-based Tactile Imprints},
    •   booktitle = {2022 IEEE International Conference on Robotics and Automation (ICRA)},
    •   publisher = {IEEE},
    •   year      = {2022},
    •   month     = may,
    •   pages     = {4833--4839},
    •   doi       = {10.1109/ICRA46639.2022.9812092},
    •   isbn      = {978-1-7281-9681-7},
    •   url       = {https://www.merl.com/publications/TR2022-055},
    • }
  •  Shah, A.P., Geng, S., Gao, P., Cherian, A., Hori, T., Marks, T.K., Le Roux, J., Hori, C., "Audio-Visual Scene-Aware Dialog and Reasoning Using Audio-Visual Transformers with Joint Student-Teacher Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2022, pp. 7732-7736.
    BibTeX TR2022-019 PDF
    • @inproceedings{Shah2022apr,
    •   author    = {Shah, Ankit Parag and Geng, Shijie and Gao, Peng and Cherian, Anoop and Hori, Takaaki and Marks, Tim K. and Le Roux, Jonathan and Hori, Chiori},
    •   title     = {Audio-Visual Scene-Aware Dialog and Reasoning Using Audio-Visual Transformers with Joint Student-Teacher Learning},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   publisher = {IEEE},
    •   year      = {2022},
    •   month     = apr,
    •   pages     = {7732--7736},
    •   isbn      = {978-1-6654-0540-9},
    •   issn      = {1520-6149},
    •   url       = {https://www.merl.com/publications/TR2022-019},
    • }
  •  Hori, C., Shah, A.P., Geng, S., Gao, P., Cherian, A., Hori, T., Le Roux, J., Marks, T.K., "Overview of Audio Visual Scene-Aware Dialog with Reasoning Track for Natural Language Generation in DSTC10", The 10th Dialog System Technology Challenge Workshop at AAAI, February 2022.
    BibTeX TR2022-016 PDF
    • @inproceedings{Hori2022feb,
    • author = {Hori, Chiori and Shah, Ankit Parag and Geng, Shijie and Gao, Peng and Cherian, Anoop and Hori, Takaaki and Le Roux, Jonathan and Marks, Tim K.},
    • title = {Overview of Audio Visual Scene-Aware Dialog with Reasoning Track for Natural Language Generation in {DSTC10}},
    • booktitle = {The 10th Dialog System Technology Challenge Workshop at AAAI},
    • year = 2022,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2022-016}
    • }
  •  Shah, A.P., Hori, T., Le Roux, J., Hori, C., "DSTC10-AVSD Submission System with Reasoning using Audio-Visual Transformers with Joint Student-Teacher Learning", February 2022.
    BibTeX TR2022-025 PDF
    • @misc{Shah2022feb,
    • author = {Shah, Ankit Parag and Hori, Takaaki and Le Roux, Jonathan and Hori, Chiori},
    • title = {{DSTC10-AVSD} Submission System with Reasoning using Audio-Visual Transformers with Joint Student-Teacher Learning},
    • year = 2022,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2022-025}
    • }
  •  Cherian, A., Hori, C., Marks, T.K., Le Roux, J., "(2.5+1)D Spatio-Temporal Scene Graphs for Video Question Answering", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v36i1.19922, February 2022, pp. 444-453.
    BibTeX TR2022-014 PDF Video Presentation
    • @inproceedings{Cherian2022feb,
    • author = {Cherian, Anoop and Hori, Chiori and Marks, Tim K. and Le Roux, Jonathan},
    • title = {{(2.5+1)D} Spatio-Temporal Scene Graphs for Video Question Answering},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {444--453},
    • month = feb,
    • doi = {10.1609/aaai.v36i1.19922},
    • url = {https://www.merl.com/publications/TR2022-014}
    • }
  •  Ke, L., Peng, K.-C., Lyu, S., "Towards To-a-T Spatio-Temporal Focus for Skeleton-Based Action Recognition", AAAI Conference on Artificial Intelligence, February 2022.
    BibTeX TR2022-015 PDF Presentation
    • @inproceedings{Ke2022feb,
    • author = {Ke, Lipeng and Peng, Kuan-Chuan and Lyu, Siwei},
    • title = {Towards {To-a-T} Spatio-Temporal Focus for Skeleton-Based Action Recognition},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2022-015}
    • }
  •  Shah, A., Sra, S., Chellappa, R., Cherian, A., "Max-Margin Contrastive Learning", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v36i8.20796, February 2022, pp. 8220-8230.
    BibTeX TR2022-013 PDF
    • @inproceedings{Shah2022feb2,
    • author = {Shah, Anshul and Sra, Suvrit and Chellappa, Rama and Cherian, Anoop},
    • title = {Max-Margin Contrastive Learning},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {8220--8230},
    • month = feb,
    • doi = {10.1609/aaai.v36i8.20796},
    • url = {https://www.merl.com/publications/TR2022-013}
    • }
  •  Medin, S.C., Egger, B., Cherian, A., Wang, Y., Tenenbaum, J.B., Liu, X., Marks, T.K., "MOST-GAN: 3D Morphable StyleGAN for Disentangled Face Image Manipulation", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v36i2.20091, February 2022, pp. 1962-1971.
    BibTeX TR2022-011 PDF Video Data Presentation
    • @inproceedings{Medin2022feb,
    • author = {Medin, Safa C. and Egger, Bernhard and Cherian, Anoop and Wang, Ye and Tenenbaum, Joshua B. and Liu, Xiaoming and Marks, Tim K.},
    • title = {{MOST-GAN}: {3D} Morphable {StyleGAN} for Disentangled Face Image Manipulation},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {1962--1971},
    • month = feb,
    • doi = {10.1609/aaai.v36i2.20091},
    • url = {https://www.merl.com/publications/TR2022-011}
    • }
  •  Lohit, S., Jones, M.J., "Model Compression Using Optimal Transport", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2022.
    BibTeX TR2022-006 PDF Presentation
    • @inproceedings{Lohit2022jan,
    •   author    = {Lohit, Suhas and Jones, Michael J.},
    •   title     = {Model Compression Using Optimal Transport},
    •   booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    •   publisher = {CVF OpenAccess},
    •   year      = {2022},
    •   month     = jan,
    •   url       = {https://www.merl.com/publications/TR2022-006},
    • }
  •  Yu, X., van Baar, J., Chen, S., Sullivan, A., "Keypoint-aligned 3D Human Shape Recovery from A Single Image with Bilayer-Graph", International Conference on 3D Vision (3DV), DOI: 10.1109/​3DV53792.2021.00060, December 2021, pp. 505-514.
    BibTeX TR2021-143 PDF
    • @inproceedings{Yu2021dec,
    • author = {Yu, Xin and van Baar, Jeroen and Chen, Siheng and Sullivan, Alan},
    • title = {Keypoint-aligned {3D} Human Shape Recovery from A Single Image with Bilayer-Graph},
    • booktitle = {International Conference on 3D Vision (3DV)},
    • year = 2021,
    • pages = {505--514},
    • month = dec,
    • doi = {10.1109/3DV53792.2021.00060},
    • url = {https://www.merl.com/publications/TR2021-143}
    • }