Publications

591 / 3,604 publications found.


  •  Jain, S., Corcodel, R., Jha, D.K., Romeres, D., "Vision Guided Food Assembly by Robot Teaching from Target Composition", ICRA 2023 Workshop on Task-Informed Grasping IV (TIG-IV): From Farm to Fork, May 2023.
    BibTeX TR2023-067 PDF
    @inproceedings{Jain2023may,
      author    = {Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego},
      title     = {Vision Guided Food Assembly by Robot Teaching from Target Composition},
      booktitle = {ICRA 2023 Workshop on Task-Informed Grasping IV (TIG-IV): From Farm to Fork},
      year      = 2023,
      month     = may,
      url       = {https://www.merl.com/publications/TR2023-067}
    }
  •  Cherian, A., Jain, S., Marks, T.K., Sullivan, A., "Discriminative 3D Shape Modeling for Few-Shot Instance Segmentation", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160644, May 2023, pp. 9296-9302.
    BibTeX TR2023-010 PDF Presentation
    % "3D" is braced so sentence-casing styles do not lowercase it.
    @inproceedings{Cherian2023may,
      author    = {Cherian, Anoop and Jain, Siddarth and Marks, Tim K. and Sullivan, Alan},
      title     = {Discriminative {3D} Shape Modeling for Few-Shot Instance Segmentation},
      booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
      year      = 2023,
      pages     = {9296--9302},
      month     = may,
      publisher = {IEEE},
      doi       = {10.1109/ICRA48891.2023.10160644},
      url       = {https://www.merl.com/publications/TR2023-010}
    }
  •  Ota, K., Tung, H.-Y., Smith, K., Cherian, A., Marks, T.K., Sullivan, A., Kanezaki, A., Tenenbaum, J.B., "H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160575, May 2023, pp. 7272-7278.
    BibTeX TR2023-009 PDF
    % The acronym "H-SAUR" is braced so sentence-casing styles keep its capitals.
    @inproceedings{Ota2023may,
      author    = {Ota, Kei and Tung, Hsiao-Yu and Smith, Kevin and Cherian, Anoop and Marks, Tim K. and Sullivan, Alan and Kanezaki, Asako and Tenenbaum, Joshua B.},
      title     = {{H-SAUR}: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions},
      booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
      year      = 2023,
      pages     = {7272--7278},
      month     = may,
      publisher = {IEEE},
      doi       = {10.1109/ICRA48891.2023.10160575},
      url       = {https://www.merl.com/publications/TR2023-009}
    }
  •  Shah, A., Roy, A., Shah, K., Mishra, S.K., Jacobs, D., Cherian, A., Chellappa, R., "HaLP: Hallucinating Latent Positives for Skeleton-based Self-Supervised Learning of Actions", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2023, pp. 18846-18856.
    BibTeX TR2023-035 PDF
    % The mixed-case name "HaLP" is braced so sentence-casing styles leave it intact.
    @inproceedings{Shah2023may,
      author    = {Shah, Anshul and Roy, Aniket and Shah, Ketul and Mishra, Shlok Kumar and Jacobs, David and Cherian, Anoop and Chellappa, Rama},
      title     = {{HaLP}: Hallucinating Latent Positives for Skeleton-based Self-Supervised Learning of Actions},
      booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
      year      = 2023,
      pages     = {18846--18856},
      month     = may,
      publisher = {CVF},
      url       = {https://www.merl.com/publications/TR2023-035}
    }
  •  Zhang, J., Cherian, A., Liu, Y., Shabat, I.B., Rodriguez, C., Gould, S., "Aligning Step-by-Step Instructional Diagrams to Video Demonstrations", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2023, pp. 2483-2492.
    BibTeX TR2023-034 PDF
    @inproceedings{Zhang2023may,
      author    = {Zhang, Jiahao and Cherian, Anoop and Liu, Yanbin and Shabat, Itzik Ben and Rodriguez, Cristian and Gould, Stephen},
      title     = {Aligning Step-by-Step Instructional Diagrams to Video Demonstrations},
      booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
      year      = 2023,
      pages     = {2483--2492},
      month     = may,
      publisher = {CVF},
      url       = {https://www.merl.com/publications/TR2023-034}
    }
  •  Jeon, E.S., Lohit, S., Anirudh, R., Turaga, P., "Robust Time Series Recovery and Classification Using Test-time Noise Simulator Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10096888, May 2023.
    BibTeX TR2023-021 PDF Presentation
    @inproceedings{Jeon2023may,
      author    = {Jeon, Eun Som and Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
      title     = {Robust Time Series Recovery and Classification Using Test-time Noise Simulator Networks},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year      = 2023,
      month     = may,
      publisher = {IEEE},
      doi       = {10.1109/ICASSP49357.2023.10096888},
      url       = {https://www.merl.com/publications/TR2023-021}
    }
  •  Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
    BibTeX TR2023-014 PDF Data Software Presentation
    % "SMARTer" is braced so sentence-casing styles keep its capitals.
    @inproceedings{Cherian2023mar,
      author    = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
      title     = {Are Deep Neural Networks {SMARTer} than Second Graders?},
      booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
      year      = 2023,
      pages     = {10834--10844},
      month     = mar,
      publisher = {CVF},
      url       = {https://www.merl.com/publications/TR2023-014}
    }
  •  Mateus, A., Ranade, S., Ramalingam, S., Miraldo, P., "Fast and Accurate 3D Registration from Line Intersection Constraints", International Journal of Computer Vision, DOI: 10.1007/s11263-023-01774-1, Vol. 131, pp. 2044-2069, February 2023.
    BibTeX TR2023-007 PDF
    % "3D" is braced so sentence-casing styles do not lowercase it.
    @article{Mateus2023feb,
      author  = {Mateus, Andre and Ranade, Siddhant and Ramalingam, Srikumar and Miraldo, Pedro},
      title   = {Fast and Accurate {3D} Registration from Line Intersection Constraints},
      journal = {International Journal of Computer Vision},
      year    = 2023,
      volume  = 131,
      pages   = {2044--2069},
      month   = feb,
      doi     = {10.1007/s11263-023-01774-1},
      url     = {https://www.merl.com/publications/TR2023-007}
    }
  •  Aich, A., Peng, K.-C., Roy-Chowdhury, A.K., "Cross-Domain Video Anomaly Detection without Target Domain Adaptation", IEEE Winter Conference on Applications of Computer Vision (WACV), Crandall, D. and Gong, B. and Lee, Y. J. and Souvenir, R. and Yu, S., Eds., DOI: 10.1109/WACV56688.2023.00261, January 2023, pp. 2578-2590.
    BibTeX TR2023-001 PDF Video Presentation
    @inproceedings{Aich2023jan,
      author    = {Aich, Abhishek and Peng, Kuan-Chuan and Roy-Chowdhury, Amit K.},
      title     = {Cross-Domain Video Anomaly Detection without Target Domain Adaptation},
      booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
      year      = 2023,
      editor    = {Crandall, D. and Gong, B. and Lee, Y. J. and Souvenir, R. and Yu, S.},
      pages     = {2578--2590},
      month     = jan,
      publisher = {IEEE},
      doi       = {10.1109/WACV56688.2023.00261},
      issn      = {2642-9381},
      isbn      = {978-1-6654-9346-8},
      url       = {https://www.merl.com/publications/TR2023-001}
    }
  •  Shimoya, R., Morimoto, T., van Baar, J., Boufounos, P.T., Ma, Y., Mansour, H., "Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images", IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), DOI: 10.1109/AVSS56176.2022.9959354, November 2022, pp. 1-8.
    BibTeX TR2022-149 PDF
    % NOTE(review): the second author's given name was spelled "Tahashi" in this
    % record; corrected to "Takashi" -- confirm against the published paper.
    @inproceedings{Shimoya2022nov,
      author    = {Shimoya, Ryosuke and Morimoto, Takashi and van Baar, Jeroen and Boufounos, Petros T. and Ma, Yanting and Mansour, Hassan},
      title     = {Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images},
      booktitle = {IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS)},
      year      = 2022,
      pages     = {1--8},
      month     = nov,
      doi       = {10.1109/AVSS56176.2022.9959354},
      isbn      = {978-1-6654-6382-9},
      url       = {https://www.merl.com/publications/TR2022-149}
    }
  •  Romero, D., Lohit, S., "Learning Partial Equivariances from Data", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 36466-36478.
    BibTeX TR2022-148 PDF Presentation
    @inproceedings{Romero2022nov,
      author    = {Romero, David and Lohit, Suhas},
      title     = {Learning Partial Equivariances from Data},
      booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
      year      = 2022,
      editor    = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
      pages     = {36466--36478},
      month     = nov,
      url       = {https://www.merl.com/publications/TR2022-148}
    }
  •  Wang, H., Lohit, S., Jones, M.J., Fu, R., "What Makes a “Good” Data Augmentation in Knowledge Distillation – A Statistical Perspective", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 13456-13469.
    BibTeX TR2022-147 PDF
    % Curly quotes and the en dash are written as LaTeX ligatures (``...'' and --)
    % so the title stays ASCII and typesets correctly under classic BibTeX.
    @inproceedings{Wang2022nov,
      author    = {Wang, Huan and Lohit, Suhas and Jones, Michael J. and Fu, Raymond},
      title     = {What Makes a ``Good'' Data Augmentation in Knowledge Distillation -- A Statistical Perspective},
      booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
      year      = 2022,
      editor    = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
      pages     = {13456--13469},
      month     = nov,
      url       = {https://www.merl.com/publications/TR2022-147}
    }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation", Advances in Neural Information Processing Systems (NeurIPS), November 2022.
    BibTeX TR2022-140 PDF Presentation
    @inproceedings{Chatterjee2022nov,
      author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
      title     = {Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation},
      booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
      year      = 2022,
      month     = nov,
      url       = {https://www.merl.com/publications/TR2022-140}
    }
  •  Ahmed, S.M., Lohit, S., Peng, K.-C., Jones, M.J., Roy Chowdhury, A.K., "Cross-Modal Knowledge Transfer Without Task-Relevant Source Data", European Conference on Computer Vision (ECCV), Avidan, S and Brostow, G and Cisse M and Farinella, G.M. and Hassner T., Eds., DOI: 10.1007/978-3-031-19830-4_7, October 2022, pp. 111-127.
    BibTeX TR2022-135 PDF Video Software Presentation
    % Every editor is written "Last, F." so BibTeX splits surname and initials
    % correctly; two of them previously had no comma. The last author's surname
    % is hyphenated here to match the spelling used for the same person in the
    % Aich2023jan record.
    @inproceedings{Ahmed2022oct,
      author    = {Ahmed, Sk Miraj and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Roy-Chowdhury, Amit K.},
      title     = {Cross-Modal Knowledge Transfer Without Task-Relevant Source Data},
      booktitle = {Computer Vision--ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23--27, 2022, Proceedings, Part XXXIV},
      year      = 2022,
      editor    = {Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G. M. and Hassner, T.},
      pages     = {111--127},
      month     = oct,
      publisher = {Springer},
      doi       = {10.1007/978-3-031-19830-4_7},
      isbn      = {978-3-031-19830-4},
      url       = {https://www.merl.com/publications/TR2022-135}
    }
  •  Paul, S., Roy Chowdhury, A.K., Cherian, A., "AVLEN: Audio-Visual-Language Embodied Navigation in 3D Environments", Advances in Neural Information Processing Systems (NeurIPS), October 2022, pp. 6236-6249.
    BibTeX TR2022-131 PDF Video Data Software
    % "AVLEN" and "3D" are braced so sentence-casing styles keep their capitals.
    % The second author's surname is hyphenated to match the spelling used for
    % the same person in the Aich2023jan record.
    @inproceedings{Paul2022oct2,
      author    = {Paul, Sudipta and Roy-Chowdhury, Amit K. and Cherian, Anoop},
      title     = {{AVLEN}: Audio-Visual-Language Embodied Navigation in {3D} Environments},
      booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
      year      = 2022,
      pages     = {6236--6249},
      month     = oct,
      url       = {https://www.merl.com/publications/TR2022-131}
    }
  •  Mansour, H., Lohit, S., Boufounos, P.T., "Distributed Radar Autofocus Imaging Using Deep Priors", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/ICIP46576.2022.9897332, October 2022, pp. 2511-2515.
    BibTeX TR2022-129 PDF Video
    @inproceedings{Mansour2022oct,
      author    = {Mansour, Hassan and Lohit, Suhas and Boufounos, Petros T.},
      title     = {Distributed Radar Autofocus Imaging Using Deep Priors},
      booktitle = {IEEE International Conference on Image Processing (ICIP)},
      year      = 2022,
      pages     = {2511--2515},
      month     = oct,
      doi       = {10.1109/ICIP46576.2022.9897332},
      url       = {https://www.merl.com/publications/TR2022-129}
    }
  •  Hori, C., Hori, T., Le Roux, J., "Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers", Interspeech, DOI: 10.21437/Interspeech.2022-10891, September 2022, pp. 4511-4515.
    BibTeX TR2022-116 PDF
    @inproceedings{Hori2022sep,
      author    = {Hori, Chiori and Hori, Takaaki and Le Roux, Jonathan},
      title     = {Low-Latency Streaming Scene-aware Interaction Using Audio-Visual Transformers},
      booktitle = {Interspeech},
      year      = 2022,
      pages     = {4511--4515},
      month     = sep,
      doi       = {10.21437/Interspeech.2022-10891},
      url       = {https://www.merl.com/publications/TR2022-116}
    }
  •  Rambhatla, S., Jones, M.J., Chellappa, R., "An Empirical Analysis of Boosting Deep Networks", International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/IJCNN55064.2022.9892204, July 2022.
    BibTeX TR2022-075 PDF Presentation
    @inproceedings{Rambhatla2022jul,
      author    = {Rambhatla, Sai and Jones, Michael J. and Chellappa, Rama},
      title     = {An Empirical Analysis of Boosting Deep Networks},
      booktitle = {International Joint Conference on Neural Networks (IJCNN)},
      year      = 2022,
      month     = jul,
      doi       = {10.1109/IJCNN55064.2022.9892204},
      url       = {https://www.merl.com/publications/TR2022-075}
    }
  •  Miraldo, P., Iglesias, J.P., "A Unified Model for Line Projections in Catadioptric Cameras with Rotationally Symmetric Mirrors", IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR52688.2022.01534, June 2022.
    BibTeX TR2022-084 PDF
    @inproceedings{Miraldo2022jun,
      author    = {Miraldo, Pedro and Iglesias, Jose Pedro},
      title     = {A Unified Model for Line Projections in Catadioptric Cameras with Rotationally Symmetric Mirrors},
      booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
      year      = 2022,
      month     = jun,
      doi       = {10.1109/CVPR52688.2022.01534},
      url       = {https://www.merl.com/publications/TR2022-084}
    }
  •  Sullivan, A., Wang, J., Li, X., Chen, S., Abbot, L., "PointMotionNet: Point-Wise Motion Learning for Large-Scale LiDAR Point Clouds Sequences", CVPR Workshop on Autonomous Driving, June 2022.
    BibTeX TR2022-083 PDF
    % "PointMotionNet" and "LiDAR" are braced so sentence-casing styles keep
    % their internal capitals.
    @inproceedings{Sullivan2022jun,
      author    = {Sullivan, Alan and Wang, Jun and Li, Xiaolong and Chen, Siheng and Abbot, Lynn},
      title     = {{PointMotionNet}: Point-Wise Motion Learning for Large-Scale {LiDAR} Point Clouds Sequences},
      booktitle = {CVPR Workshop on Autonomous Driving},
      year      = 2022,
      month     = jun,
      url       = {https://www.merl.com/publications/TR2022-083}
    }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Quantifying Predictive Uncertainty for Stochastic Video Synthesis from Audio", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), June 2022.
    BibTeX TR2022-082 PDF
    @inproceedings{Chatterjee2022jun,
      author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
      title     = {Quantifying Predictive Uncertainty for Stochastic Video Synthesis from Audio},
      booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
      year      = 2022,
      month     = jun,
      url       = {https://www.merl.com/publications/TR2022-082}
    }
  •  Zhu, X., Jain, S., Tomizuka, M., van Baar, J., "Learning to Synthesize Volumetric Meshes from Vision-based Tactile Imprints", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA46639.2022.9812092, May 2022, pp. 4833-4839.
    BibTeX TR2022-055 PDF
    % The venue name omits the leading year so it matches the other ICRA records
    % in this list; the year is already carried by the year field.
    @inproceedings{Zhu2022may2,
      author    = {Zhu, Xinghao and Jain, Siddarth and Tomizuka, Masayoshi and van Baar, Jeroen},
      title     = {Learning to Synthesize Volumetric Meshes from Vision-based Tactile Imprints},
      booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
      year      = 2022,
      pages     = {4833--4839},
      month     = may,
      publisher = {IEEE},
      doi       = {10.1109/ICRA46639.2022.9812092},
      isbn      = {978-1-7281-9681-7},
      url       = {https://www.merl.com/publications/TR2022-055}
    }
  •  Shah, A.P., Geng, S., Gao, P., Cherian, A., Hori, T., Marks, T.K., Le Roux, J., Hori, C., "Audio-Visual Scene-Aware Dialog and Reasoning Using Audio-Visual Transformers with Joint Student-Teacher Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2022, pp. 7732-7736.
    BibTeX TR2022-019 PDF
    @inproceedings{Shah2022apr,
      author    = {Shah, Ankit Parag and Geng, Shijie and Gao, Peng and Cherian, Anoop and Hori, Takaaki and Marks, Tim K. and Le Roux, Jonathan and Hori, Chiori},
      title     = {Audio-Visual Scene-Aware Dialog and Reasoning Using Audio-Visual Transformers with Joint Student-Teacher Learning},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year      = 2022,
      pages     = {7732--7736},
      month     = apr,
      publisher = {IEEE},
      issn      = {1520-6149},
      isbn      = {978-1-6654-0540-9},
      url       = {https://www.merl.com/publications/TR2022-019}
    }
  •  Hori, C., Shah, A.P., Geng, S., Gao, P., Cherian, A., Hori, T., Le Roux, J., Marks, T.K., "Overview of Audio Visual Scene-Aware Dialog with Reasoning Track for Natural Language Generation in DSTC10", The 10th Dialog System Technology Challenge Workshop at AAAI, February 2022.
    BibTeX TR2022-016 PDF
    % "DSTC10" is braced so sentence-casing styles keep its capitals.
    @inproceedings{Hori2022feb,
      author    = {Hori, Chiori and Shah, Ankit Parag and Geng, Shijie and Gao, Peng and Cherian, Anoop and Hori, Takaaki and Le Roux, Jonathan and Marks, Tim K.},
      title     = {Overview of Audio Visual Scene-Aware Dialog with Reasoning Track for Natural Language Generation in {DSTC10}},
      booktitle = {The 10th Dialog System Technology Challenge Workshop at AAAI},
      year      = 2022,
      month     = feb,
      url       = {https://www.merl.com/publications/TR2022-016}
    }
  •  Shah, A.P., Hori, T., Le Roux, J., Hori, C., "DSTC10-AVSD Submission System with Reasoning using Audio-Visual Transformers with Joint Student-Teacher Learning", February 2022.
    BibTeX TR2022-025 PDF
    % This record has no venue and no publisher, so the book type (which requires
    % a publisher) does not fit; it is typed as a technical report instead.
    % The report number is taken from the record's URL.
    % NOTE(review): the institution name is inferred from the merl.com domain -- confirm.
    @techreport{Shah2022feb,
      author      = {Shah, Ankit Parag and Hori, Takaaki and Le Roux, Jonathan and Hori, Chiori},
      title       = {{DSTC10-AVSD} Submission System with Reasoning using Audio-Visual Transformers with Joint Student-Teacher Learning},
      institution = {Mitsubishi Electric Research Laboratories},
      number      = {TR2022-025},
      year        = 2022,
      month       = feb,
      url         = {https://www.merl.com/publications/TR2022-025}
    }