Publications

Chakrabarty, A., Jha, D.K., Buzzard, G.T., Wang, Y., Vamvoudakis, K., "Safe Approximate Dynamic Programming via Kernelized Lipschitz Estimation", IEEE Transactions on Neural Networks and Learning Systems, DOI: 10.1109/TNNLS.2020.2978805, July 2020.
BibTeX TR2020-108 PDF
- @article{Chakrabarty2020jul2,
- author = {Chakrabarty, Ankush and Jha, Devesh K. and Buzzard, Gregery T. and Wang, Yebin and Vamvoudakis, Kyriakos},
- title = {Safe Approximate Dynamic Programming via Kernelized {Lipschitz} Estimation},
- journal = {IEEE Transactions on Neural Networks and Learning Systems},
- year = 2020,
- month = jul,
- doi = {10.1109/TNNLS.2020.2978805},
- url = {https://www.merl.com/publications/TR2020-108}
- }
Romeres, D., Liu, Y., Jha, D.K., Nikovski, D.N., "Understanding Multi-Modal Perception Using Behavioral Cloning for Peg-In-a-Hole Insertion Tasks", Robotics: Science and Systems, July 2020.
BibTeX TR2020-110 PDF
- @inproceedings{Romeres2020jul,
-   author    = {Romeres, Diego and Liu, Yifang and Jha, Devesh K. and Nikovski, Daniel N.},
-   title     = {Understanding Multi-Modal Perception Using Behavioral Cloning for Peg-In-a-Hole Insertion Tasks},
-   booktitle = {Robotics: Science and Systems},
-   month     = jul,
-   year      = {2020},
-   url       = {https://www.merl.com/publications/TR2020-110},
- }
Ota, K., Oiki, T., Jha, D.K., Mariyama, T., Nikovski, D.N., "Can Increasing Input Dimensionality Improve Deep Reinforcement Learning?", International Conference on Machine Learning (ICML), Daumé III, Hal and Singh, Aarti, Eds., June 2020, pp. 7424-7433.
BibTeX TR2020-083 PDF Software
- @inproceedings{Ota2020jun,
- author = {Ota, Kei and Oiki, Tomoaki and Jha, Devesh K. and Mariyama, Toshisada and Nikovski, Daniel N.},
- title = {Can Increasing Input Dimensionality Improve Deep Reinforcement Learning?},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2020,
- editor = {Daum{\'e}, III, Hal and Singh, Aarti},
- pages = {7424--7433},
- month = jun,
- publisher = {PMLR},
- url = {https://www.merl.com/publications/TR2020-083}
- }
Jha, D.K., Kolaric, P., Raghunathan, A., Lewis, F., Benosman, M., Romeres, D., Nikovski, D.N., "Local Policy Optimization for Trajectory-Centric Reinforcement Learning", IEEE International Conference on Robotics and Automation (ICRA), Ayanna Howard, Ed., May 2020, pp. 5094-5100.
BibTeX TR2020-062 PDF
- @inproceedings{Jha2020may,
- author = {Jha, Devesh K. and Kolaric, Patrik and Raghunathan, Arvind and Lewis, Frank and Benosman, Mouhacine and Romeres, Diego and Nikovski, Daniel N.},
- title = {Local Policy Optimization for Trajectory-Centric Reinforcement Learning},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
- year = 2020,
- editor = {Howard, Ayanna},
- pages = {5094--5100},
- month = may,
- publisher = {IEEE},
- isbn = {978-1-7281-7395-5},
- url = {https://www.merl.com/publications/TR2020-062}
- }
Romeres, D., Dalla Libera, A., Jha, D.K., Yerazunis, W.S., Nikovski, D.N., "Model-Based Reinforcement Learning for Physical Systems Without Velocity and Acceleration Measurements", Robotics and Automation Letters, DOI: 10.1109/LRA.2020.2977255, Vol. 5, No. 2, pp. 3548-3555, May 2020.
BibTeX TR2020-063 PDF
- @article{Romeres2020may,
- author = {Romeres, Diego and Dalla Libera, Alberto and Jha, Devesh K. and Yerazunis, William S. and Nikovski, Daniel N.},
- title = {Model-Based Reinforcement Learning for Physical Systems Without Velocity and Acceleration Measurements},
- journal = {IEEE Robotics and Automation Letters},
- year = 2020,
- volume = 5,
- number = 2,
- pages = {3548--3555},
- month = may,
- doi = {10.1109/LRA.2020.2977255},
- issn = {2377-3766},
- url = {https://www.merl.com/publications/TR2020-063}
- }
Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Parsons, K., Sang, F., Klamkin, J., "Deep Neural Networks for Designing Integrated Photonics", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/OFC.2020.Th1A.6, March 2020.
BibTeX TR2020-057 PDF
- @inproceedings{Kojima2020mar,
- author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Parsons, Kieran and Sang, Fengqiao and Klamkin, Jonathan},
- title = {Deep Neural Networks for Designing Integrated Photonics},
- booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
- year = 2020,
- month = mar,
- publisher = {Optical Society of America},
- doi = {10.1364/OFC.2020.Th1A.6},
- isbn = {978-1-943580-71-2},
- url = {https://www.merl.com/publications/TR2020-057}
- }
Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D.K., Parsons, K., Qi, M., "Generative Deep Learning Model for a Multi-level NanoOptic Broadband Power Splitter", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/OFC.2020.Th1A.1, March 2020, pp. Th1A.1.
BibTeX TR2020-025 PDF
- @inproceedings{Tang2020mar,
- author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh K. and Parsons, Kieran and Qi, Minghao},
- title = {Generative Deep Learning Model for a Multi-level {NanoOptic} Broadband Power Splitter},
- booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
- year = 2020,
- pages = {Th1A.1},
- month = mar,
- publisher = {Optical Society of America},
- doi = {10.1364/OFC.2020.Th1A.1},
- isbn = {978-1-943580-71-2},
- url = {https://www.merl.com/publications/TR2020-025}
- }
Jha, D.K., Kolaric, P., Romeres, D., Raghunathan, A., Benosman, M., Nikovski, D.N., "Robust Optimization for Trajectory-Centric Model-based Reinforcement Learning", NeurIPS Workshop on Safety and Robustness in Decision Making, December 2019.
BibTeX TR2019-156 PDF
- @inproceedings{Jha2019dec2,
-   author    = {Jha, Devesh K. and Kolaric, Patrik and Romeres, Diego and Raghunathan, Arvind and Benosman, Mouhacine and Nikovski, Daniel N.},
-   title     = {Robust Optimization for Trajectory-Centric Model-based Reinforcement Learning},
-   booktitle = {NeurIPS Workshop on Safety and Robustness in Decision Making},
-   month     = dec,
-   year      = {2019},
-   url       = {https://www.merl.com/publications/TR2019-156},
- }
Jha, D.K., Raghunathan, A., Romeres, D., "QNTRPO: Including Curvature in TRPO", Optimization Foundations for Reinforcement Learning Workshop at NeurIPS, December 2019.
BibTeX TR2019-154 PDF Software
- @inproceedings{Jha2019dec,
- author = {Jha, Devesh K. and Raghunathan, Arvind and Romeres, Diego},
- title = {{QNTRPO}: Including Curvature in {TRPO}},
- booktitle = {Optimization Foundations for Reinforcement Learning Workshop at NeurIPS},
- year = 2019,
- month = dec,
- url = {https://www.merl.com/publications/TR2019-154}
- }
Ota, K., Jha, D.K., Oiki, T., Miura, M., Nammoto, T., Nikovski, D., Mariyama, T., "Trajectory Optimization for Unknown Constrained Systems using Reinforcement Learning", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS40897.2019.8968010, November 2019, pp. 3487-3494.
BibTeX TR2019-129 PDF
- @inproceedings{Ota2019nov,
- author = {Ota, Kei and Jha, Devesh K. and Oiki, Tomoaki and Miura, Mamoru and Nammoto, Takashi and Nikovski, Daniel and Mariyama, Toshisada},
- title = {Trajectory Optimization for Unknown Constrained Systems using Reinforcement Learning},
- booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
- year = 2019,
- pages = {3487--3494},
- month = nov,
- publisher = {IEEE},
- doi = {10.1109/IROS40897.2019.8968010},
- issn = {2153-0866},
- isbn = {978-1-7281-4004-9},
- url = {https://www.merl.com/publications/TR2019-129}
- }
Jha, D.K., Raghunathan, A., Romeres, D., "Quasi-Newton Trust Region Policy Optimization", Conference on Robot Learning (CoRL), Leslie Pack Kaelbling and Danica Kragic and Komei Sugiura, Eds., October 2019, pp. 945-954.
BibTeX TR2019-120 PDF Software
- @inproceedings{Jha2019oct,
- author = {Jha, Devesh K. and Raghunathan, Arvind and Romeres, Diego},
- title = {{Quasi-Newton} Trust Region Policy Optimization},
- booktitle = {Conference on Robot Learning (CoRL)},
- year = 2019,
- editor = {Kaelbling, Leslie Pack and Kragic, Danica and Sugiura, Komei},
- pages = {945--954},
- month = oct,
- series = {Proceedings of Machine Learning Research},
- publisher = {PMLR},
- url = {https://www.merl.com/publications/TR2019-120}
- }
Zhang, W., Jha, D.K., Laftchiev, E., Nikovski, D.N., "Multi-label Prediction in Time Series Data using Deep Neural Networks", International Journal for Prognostics and Health Management Special Issue on Applications of Deep Learning and Emerging Analytics, Vol. 10, pp. 0-12, September 2019.
BibTeX TR2019-110 PDF
- @article{Zhang2019sep2,
- author = {Zhang, Wenyu and Jha, Devesh K. and Laftchiev, Emil and Nikovski, Daniel N.},
- title = {Multi-label Prediction in Time Series Data using Deep Neural Networks},
- journal = {International Journal of Prognostics and Health Management},
- year = 2019,
- volume = 10,
- pages = {0--12},
- month = sep,
- note = {Special Issue on Deep Learning and Emerging Analytics},
- issn = {2153-2648},
- url = {https://www.merl.com/publications/TR2019-110}
- }
Chakrabarty, A., Jha, D.K., Wang, Y., "Data-Driven Control Policies for Partially Known Systems via Kernelized Lipschitz Learning", American Control Conference (ACC), DOI: 10.23919/ACC.2019.8815325, July 2019, pp. 4192-4197.
BibTeX TR2019-047 PDF
- @inproceedings{Chakrabarty2019jul,
- author = {Chakrabarty, Ankush and Jha, Devesh K. and Wang, Yebin},
- title = {Data-Driven Control Policies for Partially Known Systems via Kernelized {Lipschitz} Learning},
- booktitle = {American Control Conference (ACC)},
- year = 2019,
- pages = {4192--4197},
- month = jul,
- publisher = {IEEE},
- doi = {10.23919/ACC.2019.8815325},
- url = {https://www.merl.com/publications/TR2019-047}
- }
Romeres, D., Jha, D.K., Dau, H., Yerazunis, W.S., Nikovski, D.N., "Anomaly Detection for Insertion Tasks in Robotic Assembly Using Gaussian Process Models", European Control Conference (ECC), DOI: 10.23919/ECC.2019.8795698, June 2019, pp. 1017-1022.
BibTeX TR2019-055 PDF
- @inproceedings{Romeres2019jun,
- author = {Romeres, Diego and Jha, Devesh K. and Dau, Hoang and Yerazunis, William S. and Nikovski, Daniel N.},
- title = {Anomaly Detection for Insertion Tasks in Robotic Assembly Using {Gaussian} Process Models},
- booktitle = {European Control Conference (ECC)},
- year = 2019,
- pages = {1017--1022},
- month = jun,
- publisher = {IEEE},
- doi = {10.23919/ECC.2019.8795698},
- isbn = {978-3-907144-00-8},
- url = {https://www.merl.com/publications/TR2019-055}
- }
Raghunathan, A., Cherian, A., Jha, D.K., "Game Theoretic Optimization via Gradient-based Nikaido-Isoda Function", International Conference on Machine Learning (ICML), Lawrence, N. and Reid, M., Eds., June 2019, pp. 5291-5300.
BibTeX TR2019-045 PDF Software
- @inproceedings{Raghunathan2019jun,
- author = {Raghunathan, Arvind and Cherian, Anoop and Jha, Devesh K.},
- title = {Game Theoretic Optimization via Gradient-based {Nikaido-Isoda} Function},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2019,
- editor = {Lawrence, N. and Reid, M.},
- pages = {5291--5300},
- month = jun,
- publisher = {PMLR},
- issn = {2640-3498},
- url = {https://www.merl.com/publications/TR2019-045}
- }
Romeres, D., Jha, D.K., Dalla Libera, A., Yerazunis, W.S., Nikovski, D.N., "Semiparametrical Gaussian Processes Learning of Forward Dynamical Models for Navigating in a Circular Maze", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA.2019.8794229, May 2019, pp. 3195-3202.
BibTeX TR2019-028 PDF Video Software
- @inproceedings{Romeres2019may,
- author = {Romeres, Diego and Jha, Devesh K. and Dalla Libera, Alberto and Yerazunis, William S. and Nikovski, Daniel N.},
- title = {Semiparametrical {Gaussian} Processes Learning of Forward Dynamical Models for Navigating in a Circular Maze},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
- year = 2019,
- pages = {3195--3202},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICRA.2019.8794229},
- issn = {2577-087X},
- isbn = {978-1-5386-6027-0},
- url = {https://www.merl.com/publications/TR2019-028}
- }
van Baar, J., Sullivan, A., Corcodel, R., Jha, D.K., Romeres, D., Nikovski, D.N., "Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA.2019.8793561, May 2019, pp. 6001-6007.
BibTeX TR2018-202 PDF Video Software
- @inproceedings{vanBaar2019may,
-   author    = {van Baar, Jeroen and Sullivan, Alan and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and Nikovski, Daniel N.},
-   title     = {Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics},
-   booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
-   pages     = {6001--6007},
-   month     = may,
-   year      = {2019},
-   doi       = {10.1109/ICRA.2019.8793561},
-   url       = {https://www.merl.com/publications/TR2018-202},
- }
TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D.K., Wang, B., Lin, C., Parsons, K., "Nanostructured Photonic Power Splitter Design via Convolutional Neural Networks", Conference on Lasers and Electro-Optics (CLEO), DOI: 10.1364/CLEO_SI.2019.SW4J.6, May 2019.
BibTeX TR2019-027 PDF
- @inproceedings{TaherSima2019may,
-   author    = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh K. and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
-   title     = {Nanostructured Photonic Power Splitter Design via Convolutional Neural Networks},
-   booktitle = {Conference on Lasers and Electro-Optics (CLEO)},
-   publisher = {Optical Society of America},
-   month     = may,
-   year      = {2019},
-   doi       = {10.1364/CLEO_SI.2019.SW4J.6},
-   url       = {https://www.merl.com/publications/TR2019-027},
- }
TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D.K., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Modeling for Integrated Photonics", Optical Fiber Communication Conference and Exposition and the National Fiber Optic Engineers Conference (OFC/NFOEC), DOI: 10.1364/OFC.2019.W3B.5, March 2019.
BibTeX TR2018-183 PDF
- @inproceedings{TaherSima2019mar,
-   author    = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh K. and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
-   title     = {Deep Neural Network Inverse Modeling for Integrated Photonics},
-   booktitle = {Optical Fiber Communication Conference and Exposition and the National Fiber Optic Engineers Conference (OFC/NFOEC)},
-   month     = mar,
-   year      = {2019},
-   doi       = {10.1364/OFC.2019.W3B.5},
-   url       = {https://www.merl.com/publications/TR2018-183},
- }
TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Design of Integrated Photonic Power Splitters", Nature Scientific Reports, DOI: 10.1038/s41598-018-37952-2, Vol. 9, pp. 1368, December 2018.
BibTeX TR2018-180 PDF
- @article{TaherSima2018dec,
- author = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh K. and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
- title = {Deep Neural Network Inverse Design of Integrated Photonic Power Splitters},
- journal = {Nature Scientific Reports},
- year = 2018,
- volume = 9,
- pages = {1368},
- month = dec,
- doi = {10.1038/s41598-018-37952-2},
- issn = {2045-2322},
- url = {https://www.merl.com/publications/TR2018-180}
- }
Romeres, D., Jha, D.K., Dalla Libera, A., Chiuso, A., Nikovski, D.N., "Derivative-Free Semiparametric Bayesian Models for Robot Learning", Advances in Neural Information Processing Systems (NIPS), December 2018.
BibTeX TR2018-165 PDF
- @inproceedings{Romeres2018dec,
- author = {Romeres, Diego and Jha, Devesh K. and Dalla Libera, Alberto and Chiuso, Alessandro and Nikovski, Daniel N.},
- title = {Derivative-Free Semiparametric {Bayesian} Models for Robot Learning},
- booktitle = {Advances in Neural Information Processing Systems (NIPS)},
- year = 2018,
- month = dec,
- url = {https://www.merl.com/publications/TR2018-165}
- }
Jha, D.K., Romeres, D., van Baar, J., Sullivan, A., Nikovski, D.N., "Learning Tasks in a Complex Circular Maze Environment", NIPS Workshop on Modeling the Physical World: Perception, Learning, and Control, December 2018.
BibTeX TR2018-169 PDF
- @inproceedings{vanBaar2018dec,
-   author    = {Jha, Devesh K. and Romeres, Diego and van Baar, Jeroen and Sullivan, Alan and Nikovski, Daniel N.},
-   title     = {Learning Tasks in a Complex Circular Maze Environment},
-   booktitle = {NIPS Workshop on Modeling the Physical World: Perception, Learning, and Control},
-   month     = dec,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-169},
- }
Jha, D.K., "Algorithms for Task Allocation in Homogeneous Swarm of Robots", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS.2018.8594052, October 2018.
BibTeX TR2018-151 PDF
- @inproceedings{Jha2018oct,
-   author    = {Jha, Devesh K.},
-   title     = {Algorithms for Task Allocation in Homogeneous Swarm of Robots},
-   booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
-   month     = oct,
-   year      = {2018},
-   doi       = {10.1109/IROS.2018.8594052},
-   url       = {https://www.merl.com/publications/TR2018-151},
- }
van Baar, J., Corcodel, R., Sullivan, A., Jha, D.K., Romeres, D., Nikovski, D.N., "Simulation to Real Transfer Learning with Robustified Policies for Robot Tasks", arXiv, September 2018.
BibTeX arXiv
- @misc{vanBaar2018sep,
- author = {van Baar, Jeroen and Corcodel, Radu and Sullivan, Alan and Jha, Devesh K. and Romeres, Diego and Nikovski, Daniel N.},
- title = {Simulation to Real Transfer Learning with Robustified Policies for Robot Tasks},
- year = 2018,
- month = sep,
- eprint = {1809.04720},
- archivePrefix = {arXiv},
- url = {https://arxiv.org/abs/1809.04720}
- }
Jha, D.K., Yerazunis, W.S., Nikovski, D.N., Farahmand, A.-M., "Learning to Regulate Rolling Ball Motion", IEEE Symposium on Computational Intelligence in Engineering Solutions, DOI: 10.1109/SSCI.2017.8285376, November 2017.
BibTeX TR2017-176 PDF
- @inproceedings{Jha2017nov,
-   author    = {Jha, Devesh K. and Yerazunis, William S. and Nikovski, Daniel N. and Farahmand, Amir-massoud},
-   title     = {Learning to Regulate Rolling Ball Motion},
-   booktitle = {IEEE Symposium on Computational Intelligence in Engineering Solutions},
-   month     = nov,
-   year      = {2017},
-   doi       = {10.1109/SSCI.2017.8285376},
-   url       = {https://www.merl.com/publications/TR2017-176},
- }