Publications

427 / 2,868 publications found.


  •  Hori, C., Cherian, A., Marks, T., Hori, T., "Joint Student-Teacher Learning for Audio-Visual Scene-Aware Dialog", Interspeech, September 2019, pp. 1886-1890.
    BibTeX Download PDFAbout TR2019-097
    • @inproceedings{Hori2019sep,
    • author = {Hori, Chiori and Cherian, Anoop and Marks, Tim and Hori, Takaaki},
    • title = {Joint Student-Teacher Learning for Audio-Visual Scene-Aware Dialog},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {1886--1890},
    • month = sep,
    • publisher = {ISCA},
    • url = {https://www.merl.com/publications/TR2019-097}
    • }
  •  Karafiat, M., Baskar, M.K., Watanabe, S., Hori, T., Wiesner, M., Cernocky, J.H., "Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems", Interspeech, September 2019.
    BibTeX Download PDFAbout TR2019-103
    • @inproceedings{Karafiat2019sep,
    • author = {Karafiat, Martin and Baskar, Murali Karthick and Watanabe, Shinji and Hori, Takaaki and Wiesner, Matthew and Cernocky, Jan Honza},
    • title = {Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems},
    • booktitle = {Interspeech},
    • year = 2019,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2019-103}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Unidirectional Neural Network Architectures for End-to-End Automatic Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2019-2837, September 2019, pp. 76-80.
    BibTeX Download PDFAbout TR2019-098
    • @inproceedings{Moritz2019sep,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Unidirectional Neural Network Architectures for End-to-End Automatic Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {76--80},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-2837},
    • url = {https://www.merl.com/publications/TR2019-098}
    • }
  •  Seki, H., Hori, T., Watanabe, S., Le Roux, J., Hershey, J., "End-to-End Multilingual Multi-Speaker Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2019-3038, September 2019, pp. 3755-3759.
    BibTeX Download PDFAbout TR2019-101
    • @inproceedings{Seki2019sep,
    • author = {Seki, Hiroshi and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan and Hershey, John},
    • title = {End-to-End Multilingual Multi-Speaker Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {3755--3759},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-3038},
    • url = {https://www.merl.com/publications/TR2019-101}
    • }
  •  Seki, H., Hori, T., Watanabe, S., Moritz, N., Le Roux, J., "Vectorized Beam Search for CTC-Attention-based Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2019-2860, September 2019, pp. 3825-3829.
    BibTeX Download PDFAbout TR2019-102
    • @inproceedings{Seki2019sep2,
    • author = {Seki, Hiroshi and Hori, Takaaki and Watanabe, Shinji and Moritz, Niko and Le Roux, Jonathan},
    • title = {Vectorized Beam Search for CTC-Attention-based Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {3825--3829},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-2860},
    • url = {https://www.merl.com/publications/TR2019-102}
    • }
  •  Zhang, Z., Lin, Z., Pfister, H., "White-Box Adversarial Defense via Self-Supervised Data Estimation", arXiv, September 2019.
    BibTeX Download PDFAbout TR2019-104
    • @article{Zhang2019sep,
    • author = {Zhang, Ziming and Lin, Zudi and Pfister, Hanspeter},
    • title = {White-Box Adversarial Defense via Self-Supervised Data Estimation},
    • journal = {arXiv},
    • year = 2019,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2019-104}
    • }
  •  Jones, M.J., Rambhatla, S., "Body Part Alignment and Temporal Attention for Video-Based Person Re-Identification", British Machine Vision Conference (BMVC), September 2019.
    BibTeX Download PDFAbout TR2019-108
    • @inproceedings{Jones2019sep,
    • author = {Jones, Michael J. and Rambhatla, Sai},
    • title = {Body Part Alignment and Temporal Attention for Video-Based Person Re-Identification},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2019,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2019-108}
    • }
  •  Yalta, N., Watanabe, S., Hori, T., Nakadai, K., Ogata, T., "CNN-based Multichannel End-to-End Speech Recognition for Everyday Home Environments", European Signal Processing Conference (EUSIPCO), September 2019.
    BibTeX Download PDFAbout TR2019-094
    • @inproceedings{Yalta2019sep,
    • author = {Yalta, Nelson and Watanabe, Shinji and Hori, Takaaki and Nakadai, Kazuhiro and Ogata, Tetsuya},
    • title = {CNN-based Multichannel End-to-End Speech Recognition for Everyday Home Environments},
    • booktitle = {European Signal Processing Conference (EUSIPCO)},
    • year = 2019,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2019-094}
    • }
  •  Wang, J., Cherian, A., "Discriminative Video Representation Learning Using Support Vector Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2019.2937292, August 2019.
    BibTeX Download PDFAbout TR2019-107
    • @article{Wang2019aug,
    • author = {Wang, Jue and Cherian, Anoop},
    • title = {Discriminative Video Representation Learning Using Support Vector Classifiers},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2019,
    • month = aug,
    • doi = {10.1109/TPAMI.2019.2937292},
    • url = {https://www.merl.com/publications/TR2019-107}
    • }
  •  Romeres, D., Jha, D., Dau, H., Yerazunis, W.S., Nikovski, D.N., "Anomaly Detection for Insertion Tasks in Robotic Assembly Using Gaussian Process Models", European Control Conference (ECC), DOI: 10.23919/ECC.2019.8795698, ISBN: 978-3-907144-00-8, June 2019, pp. 1017-1022.
    BibTeX Download PDFAbout TR2019-055
    • @inproceedings{Romeres2019jun,
    • author = {Romeres, Diego and Jha, Devesh and Dau, Hoang and Yerazunis, William S. and Nikovski, Daniel N.},
    • title = {Anomaly Detection for Insertion Tasks in Robotic Assembly Using Gaussian Process Models},
    • booktitle = {European Control Conference (ECC)},
    • year = 2019,
    • pages = {1017--1022},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.23919/ECC.2019.8795698},
    • isbn = {978-3-907144-00-8},
    • url = {https://www.merl.com/publications/TR2019-055}
    • }
  •  Alamri, H., Cartillier, V., Das, A., Wang, J., Lee, S., Anderson, P., Essa, I., Parikh, D., Batra, D., Cherian, A., Marks, T.K., Hori, C., "Audio-Visual Scene-Aware Dialog", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2019.
    BibTeX Download PDFAbout TR2019-048
    • @inproceedings{Alamri2019jun,
    • author = {Alamri, Huda and Cartillier, Vincent and Das, Abhishek and Wang, Jue and Lee, Stefan and Anderson, Peter and Essa, Irfan and Parikh, Devi and Batra, Dhruv and Cherian, Anoop and Marks, Tim K. and Hori, Chiori},
    • title = {Audio-Visual Scene-Aware Dialog},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2019,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2019-048}
    • }
  •  Lee, T.-Y., van Baar, J., Wittenburg, K.B., Sullivan, A., "Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop, June 2019.
    BibTeX Download PDFAbout TR2019-049
    • @inproceedings{Lee2019jun2,
    • author = {Lee, Teng-Yok and van Baar, Jeroen and Wittenburg, Kent B. and Sullivan, Alan},
    • title = {Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop},
    • year = 2019,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2019-049}
    • }
  •  Raghunathan, A., Cherian, A., Jha, D., "Game Theoretic Optimization via Gradient-based Nikaido-Isoda Function", International Conference on Machine Learning (ICML), Lawrence, N. and Reid, M., Eds., ISSN: 2640-3498, June 2019, pp. 5291-5300.
    BibTeX Download PDFAbout TR2019-045
    • @inproceedings{Raghunathan2019jun,
    • author = {Raghunathan, Arvind and Cherian, Anoop and Jha, Devesh},
    • title = {Game Theoretic Optimization via Gradient-based Nikaido-Isoda Function},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2019,
    • editor = {Lawrence, N. and Reid, M.},
    • pages = {5291--5300},
    • month = jun,
    • publisher = {PMLR},
    • issn = {2640-3498},
    • url = {https://www.merl.com/publications/TR2019-045}
    • }
  •  Chen, S., "Large-Scale 3D Point Cloud Representations via Graph Inception Networks with Applications to Autonomous Driving", Graph Signal Processing Workshop, June 2019.
    BibTeX Download PDFAbout TR2019-039
    • @inproceedings{Chen2019jun,
    • author = {Chen, Siheng},
    • title = {Large-Scale 3D Point Cloud Representations via Graph Inception Networks with Applications to Autonomous Driving},
    • booktitle = {Graph Signal Processing Workshop},
    • year = 2019,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2019-039}
    • }
  •  Duan, C., Chen, S., Tian, D., Moura, J., Kovacevic, J., "Deep Graph Topology Learning for 3D Point Cloud Reconstruction", Graph Signal Processing Workshop, June 2019.
    BibTeX Download PDFAbout TR2019-046
    • @inproceedings{Duan2019jun,
    • author = {Duan, Chaojing and Chen, Siheng and Tian, Dong and Moura, Jose and Kovacevic, Jelena},
    • title = {Deep Graph Topology Learning for 3D Point Cloud Reconstruction},
    • booktitle = {Graph Signal Processing Workshop},
    • year = 2019,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2019-046}
    • }
  •  Bhamidipati, S., Kim, K.J., Sun, H., Orlik, P.V., Zhang, J., "Joint BP and RNN for Resilient GPS Timing Against Spoofing Attacks", EAI International Conference on Artificial Intelligence for Communications and Networks, May 2019.
    BibTeX Download PDFAbout TR2019-036
    • @inproceedings{Bhamidipati2019may,
    • author = {Bhamidipati, Sriramya and Kim, Kyeong Jin and Sun, Hongbo and Orlik, Philip V. and Zhang, Jinyun},
    • title = {Joint BP and RNN for Resilient GPS Timing Against Spoofing Attacks},
    • booktitle = {EAI International Conference on Artificial Intelligence for Communications and Networks},
    • year = 2019,
    • month = may,
    • url = {https://www.merl.com/publications/TR2019-036}
    • }
  •  Romeres, D., Jha, D., Dalla Libera, A., Yerazunis, W.S., Nikovski, D.N., "Semiparametrical Gaussian Processes Learning of Forward Dynamical Models for Navigating in a Circular Maze", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA.2019.8794229, ISSN: 2577-087X, ISBN: 978-1-5386-6027-0, May 2019, pp. 3195-3202.
    BibTeX Download PDFAbout TR2019-028
    • @inproceedings{Romeres2019may,
    • author = {Romeres, Diego and Jha, Devesh and Dalla Libera, Alberto and Yerazunis, William S. and Nikovski, Daniel N.},
    • title = {Semiparametrical Gaussian Processes Learning of Forward Dynamical Models for Navigating in a Circular Maze},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2019,
    • pages = {3195--3202},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA.2019.8794229},
    • issn = {2577-087X},
    • isbn = {978-1-5386-6027-0},
    • url = {https://www.merl.com/publications/TR2019-028}
    • }
  •  van Baar, J., Sullivan, A., Corcodel, R., Jha, D., Romeres, D., Nikovski, D.N., "Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics", IEEE International Conference on Robotics and Automation (ICRA), May 2019.
    BibTeX Download PDFAbout TR2018-202
    • @inproceedings{vanBaar2019may,
    • author = {van Baar, Jeroen and Sullivan, Alan and Corcodel, Radu and Jha, Devesh and Romeres, Diego and Nikovski, Daniel N.},
    • title = {Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2019,
    • month = may,
    • url = {https://www.merl.com/publications/TR2018-202}
    • }
  •  Aihara, R., Hanazawa, T., Okato, Y., Wichern, G., Le Roux, J., "Teacher-Student Deep Clustering For Low-Delay Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682695, May 2019.
    BibTeX Download PDFAbout TR2019-003
    • @inproceedings{Aihara2019may,
    • author = {Aihara, Ryo and Hanazawa, Toshiyuki and Okato, Yohei and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Teacher-Student Deep Clustering For Low-Delay Channel Speech Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682695},
    • url = {https://www.merl.com/publications/TR2019-003}
    • }
  •  Baskar, M.K., Burget, L., Watanabe, S., Karafiat, M., Hori, T., Cernocky, J.H., "Promising Accurate Prefix Boosting for Sequence-to-Sequence ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2019.
    BibTeX Download PDFAbout TR2019-006
    • @inproceedings{Baskar2019may,
    • author = {Baskar, Murali Karthick and Burget, Lukas and Watanabe, Shinji and Karafiat, Martin and Hori, Takaaki and Cernocky, Jan Honza},
    • title = {Promising Accurate Prefix Boosting for Sequence-to-Sequence ASR},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • url = {https://www.merl.com/publications/TR2019-006}
    • }
  •  Cho, J., Watanabe, S., Hori, T., Baskar, M.K., Inaguma, H., Villalba, J., Dehak, N., "Language Model Integration Based on Memory Control for Sequence to Sequence Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683380, May 2019.
    BibTeX Download PDFAbout TR2019-007
    • @inproceedings{Cho2019may,
    • author = {Cho, Jaejin and Watanabe, Shinji and Hori, Takaaki and Baskar, Murali Karthick and Inaguma, Hirofumi and Villalba, Jesus and Dehak, Najim},
    • title = {Language Model Integration Based on Memory Control for Sequence to Sequence Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683380},
    • url = {https://www.merl.com/publications/TR2019-007}
    • }
  •  Hori, C., Alamri, H., Wang, J., Wichern, G., Hori, T., Cherian, A., Marks, T.K., Cartillier, V., Lopes, R., Das, A., Essa, I., Batra, D., Parikh, D., "End-to-End Audio Visual Scene-Aware Dialog Using Multimodal Attention-Based Video Features", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682583, May 2019.
    BibTeX Download PDFAbout TR2019-016
    • @inproceedings{Hori2019may2,
    • author = {Hori, Chiori and Alamri, Huda and Wang, Jue and Wichern, Gordon and Hori, Takaaki and Cherian, Anoop and Marks, Tim K. and Cartillier, Vincent and Lopes, Raphael and Das, Abhishek and Essa, Irfan and Batra, Dhruv and Parikh, Devi},
    • title = {End-to-End Audio Visual Scene-Aware Dialog Using Multimodal Attention-Based Video Features},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682583},
    • url = {https://www.merl.com/publications/TR2019-016}
    • }
  •  Hori, T., Astudillo, R., Hayashi, T., Zhang, Y., Watanabe, S., Le Roux, J., "Cycle-Consistency Training for End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683307, May 2019.
    BibTeX Download PDFAbout TR2019-002
    • @inproceedings{Hori2019may,
    • author = {Hori, Takaaki and Astudillo, Ramon and Hayashi, Tomoki and Zhang, Yu and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {Cycle-Consistency Training for End-to-End Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683307},
    • url = {https://www.merl.com/publications/TR2019-002}
    • }
  •  Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "The Phasebook: Building Complex Masks via Discrete Representations for Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682587, May 2019.
    BibTeX Download PDFAbout TR2019-008
    • @inproceedings{LeRoux2019may2,
    • author = {Le Roux, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
    • title = {The Phasebook: Building Complex Masks via Discrete Representations for Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682587},
    • url = {https://www.merl.com/publications/TR2019-008}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Triggered Attention for End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683510, May 2019.
    BibTeX Download PDFAbout TR2019-015
    • @inproceedings{Moritz2019may,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Triggered Attention for End-to-End Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683510},
    • url = {https://www.merl.com/publications/TR2019-015}
    • }