Publications

14 / 2,644 publications found.


  •  Hori, C., Alamri, H., Wang, J., Wichern, G., Hori, T., Cherian, A., Marks, T.K., Cartillier, V., Lopes, R., Das, A., Essa, I., Batra, D., Parikh, D., "End-to-End Audio Visual Scene-Aware Dialog using Multimodal Attention-Based Video Features", arXiv, July 13, 2018.
    BibTeX | Download PDF | About TR2018-085
    • @techreport{MERL_TR2018-085,
    • author = {Hori, C. and Alamri, H. and Wang, J. and Wichern, G. and Hori, T. and Cherian, A. and Marks, T. K. and Cartillier, V. and Lopes, R. and Das, A. and Essa, I. and Batra, D. and Parikh, D.},
    • title = {End-to-End Audio Visual Scene-Aware Dialog using Multimodal Attention-Based Video Features},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2018-085},
    • month = jul,
    • year = 2018,
    • url = {http://www.merl.com/publications/TR2018-085/}
    • }
  •  Alamri, H., Cartillier, V., Lopes, R., Das, A., Wang, J., Essa, I., Batra, D., Parikh, D., Cherian, A., Marks, T.K., Hori, C., "Audio Visual Scene-Aware Dialog (AVSD) Challenge at DSTC7", arXiv, July 12, 2018.
    BibTeX | Download PDF | About TR2018-069
    • @techreport{MERL_TR2018-069,
    • author = {Alamri, H. and Cartillier, V. and Lopes, R. and Das, A. and Wang, J. and Essa, I. and Batra, D. and Parikh, D. and Cherian, A. and Marks, T. K. and Hori, C.},
    • title = {Audio Visual Scene-Aware Dialog ({AVSD}) Challenge at {DSTC7}},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2018-069},
    • month = jul,
    • year = 2018,
    • url = {http://www.merl.com/publications/TR2018-069/}
    • }
  •  Hori, C., Hori, T., Marks, T.K., Hershey, J.R., "Early and Late Integration of Audio Features for Automatic Video Description", IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), DOI: 10.1109/ASRU.2017.8268968, December 2017.
  •  Hori, C., Hori, T., Lee, T.-Y., Zhang, Z., Harsham, B.A., Sumi, K., Marks, T.K., Hershey, J.R., "Attention-Based Multimodal Fusion for Video Description", IEEE International Conference on Computer Vision (ICCV), DOI: 10.1109/ICCV.2017.450, October 2017.
  •  Hori, C., Hori, T., Lee, T.-Y., Sumi, K., Hershey, J.R., Marks, T.K., "Attention-Based Multimodal Fusion for Video Description", Tech. Rep. TR2017-008, arXiv, January 2017.
    BibTeX | Download PDF | About TR2017-008
    • @techreport{MERL_TR2017-008,
    • author = {Hori, C. and Hori, T. and Lee, T.-Y. and Sumi, K. and Hershey, J. R. and Marks, T. K.},
    • title = {Attention-Based Multimodal Fusion for Video Description},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2017-008},
    • month = jan,
    • year = 2017,
    • url = {http://www.merl.com/publications/TR2017-008/}
    • }
  •  Porikli, F.; Tuzel, O., "Covariance Tracker", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2006.
    BibTeX | Download PDF | About TR2006-042
    • @inproceedings{Porikli2006jun2,
    •   author    = {Porikli, F. and Tuzel, O.},
    •   title     = {Covariance Tracker},
    •   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    •   month     = jun,
    •   year      = {2006},
    •   url       = {http://www.merl.com/publications/TR2006-042}
    • }
  •  Ma, Z.; Shao, H.-R.; Shen, C., "A New Multi-path Selection Scheme for Video Streaming on Overlay Networks", IEEE International Conference on Communications (ICC), June 2004, vol. 3, pp. 1330-1334.
    BibTeX | Download PDF | About TR2004-064
    • @inproceedings{Ma2004jun,
    •   author    = {Ma, Z. and Shao, H.-R. and Shen, C.},
    •   title     = {A New Multi-path Selection Scheme for Video Streaming on Overlay Networks},
    •   booktitle = {IEEE International Conference on Communications (ICC)},
    •   volume    = {3},
    •   pages     = {1330--1334},
    •   month     = jun,
    •   year      = {2004},
    •   url       = {http://www.merl.com/publications/TR2004-064}
    • }
  •  Xie, L.; Chang, S.-F.; Divakaran, A.; Sun, H., "Feature Selection for Unsupervised Discovery of Statistical Temporal Structures in Video", IEEE International Conference on Image Processing (ICIP), September 2003, vol. 1, pp. 29-32.
    BibTeX | Download PDF | About TR2003-116
    • @inproceedings{Xie2003sep,
    •   author    = {Xie, L. and Chang, S.-F. and Divakaran, A. and Sun, H.},
    •   title     = {Feature Selection for Unsupervised Discovery of Statistical Temporal Structures in Video},
    •   booktitle = {IEEE International Conference on Image Processing (ICIP)},
    •   volume    = {1},
    •   pages     = {29--32},
    •   month     = sep,
    •   year      = {2003},
    •   url       = {http://www.merl.com/publications/TR2003-116}
    • }
  •  Xie, L.; Chang, S.-F.; Divakaran, A.; Sun, H., "Unsupervised Discovery of Multilevel Statistical Video Structures Using Hierarchical Hidden Markov Models", IEEE International Conference on Multimedia and Expo (ICME), July 2003, vol. 3, pp. 29-32.
    BibTeX | Download PDF | About TR2003-101
    • @inproceedings{Xie2003jul,
    • author = {Xie, L. and Chang, S.-F. and Divakaran, A. and Sun, H.},
    • title = {Unsupervised Discovery of Multilevel Statistical Video Structures Using Hierarchical Hidden {Markov} Models},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2003,
    • volume = 3,
    • pages = {29--32},
    • month = jul,
    • url = {http://www.merl.com/publications/TR2003-101}
    • }
  •  Zhou, J.; Shao, H.-R.; Shen, C.; Sun, M.-T., "Multi-Path Transport of FGS Video", Packet Video (PV), April 2003.
    BibTeX | Download PDF | About TR2003-10
    • @inproceedings{Zhou2003apr,
    • author = {Zhou, J. and Shao, H.-R. and Shen, C. and Sun, M.-T.},
    • title = {Multi-Path Transport of {FGS} Video},
    • booktitle = {Packet Video (PV)},
    • year = 2003,
    • month = apr,
    • url = {http://www.merl.com/publications/TR2003-10}
    • }
  •  Lin, S.; Vetro, A.; Wang, Y., "Rate-Distortion Analysis of the Multiple Description Motion Compensation Video Coding Scheme", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), ISSN: 1520-6149, April 2003, vol. 3, pp. 401-404.
    BibTeX | Download PDF | About TR2003-27
    • @inproceedings{Lin2003apr,
    •   author    = {Lin, S. and Vetro, A. and Wang, Y.},
    •   title     = {Rate-Distortion Analysis of the Multiple Description Motion Compensation Video Coding Scheme},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   volume    = {3},
    •   pages     = {401--404},
    •   month     = apr,
    •   year      = {2003},
    •   issn      = {1520-6149},
    •   url       = {http://www.merl.com/publications/TR2003-27}
    • }
  •  Divakaran, A.; Sekiguchi, S.; Asai, K.; Sun, H., "A Description Scheme for Video Based on Feature Extraction in the Compressed Domain", IEEE International Conference on Consumer Electronics (ICCE), June 2000, pp. 278-279.
    BibTeX
    • @inproceedings{Divakaran2000jun,
    •   author    = {Divakaran, A. and Sekiguchi, S. and Asai, K. and Sun, H.},
    •   title     = {A Description Scheme for Video Based on Feature Extraction in the Compressed Domain},
    •   booktitle = {IEEE International Conference on Consumer Electronics (ICCE)},
    •   pages     = {278--279},
    •   month     = jun,
    •   year      = {2000},
    •   url       = {http://ieeexplore.ieee.org/xpl/articleDetails.jsp?arnumber=854628}
    • }
  •  Matthew Brand, "An entropic estimator for structure discovery", Tech. Rep. TR98-19, Mitsubishi Electric Research Laboratories, Cambridge, MA, September 1998.
    BibTeX | Download PDF | About TR98-19
    • @techreport{MERL_TR98-19,
    •   author      = {Brand, Matthew},
    •   title       = {An entropic estimator for structure discovery},
    •   institution = {MERL - Mitsubishi Electric Research Laboratories},
    •   address     = {Cambridge, MA 02139},
    •   number      = {TR98-19},
    •   month       = sep,
    •   year        = {1998},
    •   url         = {http://www.merl.com/publications/TR98-19/}
    • }
  •  Matthew Brand, "Learning concise models of human activity from ambient video via a structure-inducing M-step estimator", Tech. Rep. TR97-25, Mitsubishi Electric Research Laboratories, Cambridge, MA, November 1997.
    BibTeX | Download PDF | About TR97-25
    • @techreport{MERL_TR97-25,
    • author = {Brand, Matthew},
    • title = {Learning concise models of human activity from ambient video via a structure-inducing {M-step} estimator},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR97-25},
    • month = nov,
    • year = 1997,
    • url = {http://www.merl.com/publications/TR97-25/}
    • }