Publications

597 / 3,604 publications found.


  •  Wichern, G., Le Roux, J., "Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/IWAENC.2018.8521243, September 2018.
    BibTeX TR2018-146 PDF
    • @inproceedings{Wichern2018sep,
    • author = {Wichern, Gordon and Le Roux, Jonathan},
    • title = {Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation},
    • booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
    • year = 2018,
    • month = sep,
    • doi = {10.1109/IWAENC.2018.8521243},
    • url = {https://www.merl.com/publications/TR2018-146}
    • }
  •  Wang, J., Cherian, A., "Learning Discriminative Video Representations Using Adversarial Perturbations", European Conference on Computer Vision (ECCV), September 2018.
    BibTeX TR2018-139 PDF Software
    • @inproceedings{Wang2018sep3,
    • author = {Wang, Jue and Cherian, Anoop},
    • title = {Learning Discriminative Video Representations Using Adversarial Perturbations},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-139}
    • }
  •  Kocanaogullari, A., Ataer-Cansizoglu, E., "Active Descriptor Learning for Feature Matching", International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision, September 2018.
    BibTeX TR2018-132 PDF
    • @inproceedings{Kocanaogullari2018sep,
    • author = {Kocanaogullari, Aziz and Ataer-Cansizoglu, Esra},
    • title = {Active Descriptor Learning for Feature Matching},
    • booktitle = {International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-132}
    • }
  •  Shou, Z., Pan, J., Chan, J., Miyazawa, K., Mansour, H., Vetro, A., Giro-i-Nieto, X., Chang, S.-F., "Online Detection of Action Start in Untrimmed, Streaming Videos", European Conference on Computer Vision (ECCV), September 2018.
    BibTeX TR2018-109 PDF
    • @inproceedings{Shou2018sep,
    • author = {Shou, Zheng and Pan, Junting and Chan, Jonathan and Miyazawa, Kazuyuki and Mansour, Hassan and Vetro, Anthony and Giro-i-Nieto, Xavier and Chang, Shi-Fu},
    • title = {Online Detection of Action Start in Untrimmed, Streaming Videos},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-109}
    • }
  •  Wang, J., Cherian, A., "Discriminative Subspace Pooling for Action Recognition", Workshop on Perceptual Organization in Computer Vision as part of the European Conference on Computer Vision (ECCV), September 2018.
    BibTeX TR2018-141 PDF
    • @inproceedings{Wang2018sep2,
    • author = {Wang, Jue and Cherian, Anoop},
    • title = {Discriminative Subspace Pooling for Action Recognition},
    • booktitle = {Workshop on Perceptual Organization in Computer Vision as part of the European Conference on Computer Vision (ECCV)},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-141}
    • }
  •  Jones, M.J., Broad, A., Lee, T.-Y., "Recurrent Multi-frame Single Shot Detector for Video Object Detection", British Machine Vision Conference (BMVC), September 2018.
    BibTeX TR2018-137 PDF
    • @inproceedings{Jones2018sep,
    • author = {Jones, Michael J. and Broad, Alexander and Lee, Teng-Yok},
    • title = {Recurrent Multi-frame Single Shot Detector for Video Object Detection},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-137}
    • }
  •  Wang, Z.-Q., Le Roux, J., Wang, D., Hershey, J., "End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction", Interspeech, September 2018.
    BibTeX TR2018-135 PDF
    • @inproceedings{Wang2018sep,
    • author = {Wang, Zhong-Qiu and Le Roux, Jonathan and Wang, DeLiang and Hershey, John},
    • title = {End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction},
    • booktitle = {Interspeech},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-135}
    • }
  •  Watanabe, S., Hori, T., Karita, S., Hayashi, T., Nishitoba, J., Unno, Y., Enrique Yalta Soplin, N., Heymann, J., Wiesner, M., Chen, N., Renduchintala, A., Ochiai, T., "ESPnet: End-to-End Speech Processing Toolkit", Interspeech, September 2018.
    BibTeX TR2018-136 PDF
    • @inproceedings{Watanabe2018sep,
    • author = {Watanabe, Shinji and Hori, Takaaki and Karita, Shigeki and Hayashi, Tomoki and Nishitoba, Jiro and Unno, Yuya and Enrique Yalta Soplin, Nelson and Heymann, Jahn and Wiesner, Matthew and Chen, Nanxin and Renduchintala, Adithya and Ochiai, Tsubasa},
    • title = {ESPnet: End-to-End Speech Processing Toolkit},
    • booktitle = {Interspeech},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-136}
    • }
  •  Laftchiev, E., Sun, X., Dau, H.-A., Nikovski, D.N., "Anomaly Detection in Discrete Manufacturing Systems using Event Relationship Tables", International Workshop on Principles of Diagnosis, August 2018.
    BibTeX TR2018-128 PDF
    • @inproceedings{Laftchiev2018aug,
    • author = {Laftchiev, Emil and Sun, Xinmiao and Dau, Hoang-Anh and Nikovski, Daniel N.},
    • title = {Anomaly Detection in Discrete Manufacturing Systems using Event Relationship Tables},
    • booktitle = {International Workshop on Principles of Diagnosis},
    • year = 2018,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2018-128}
    • }
  •  Ataer-Cansizoglu, E., Jones, M.J., Zhang, Z., Sullivan, A., "Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network", arXiv, August 2018.
    BibTeX arXiv
    • @article{Ataer-Cansizoglu2018aug,
    • author = {Ataer-Cansizoglu, Esra and Jones, Michael J. and Zhang, Ziming and Sullivan, Alan},
    • title = {Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network},
    • journal = {arXiv},
    • year = 2018,
    • month = aug,
    • url = {https://arxiv.org/abs/1903.10974}
    • }
  •  Zhang, J., Lee, T.-Y., Feng, C., Li, X., Zhang, Z., "Robust Attentional Pooling via Feature Selection", IEEE International Conference on Pattern Recognition (ICPR), DOI: 10.1109/ICPR.2018.8545607, August 2018, pp. 2038-2043.
    BibTeX TR2018-124 PDF
    • @inproceedings{Zhang2018aug,
    • author = {Zhang, Jian and Lee, Teng-Yok and Feng, Chen and Li, Xiaohua and Zhang, Ziming},
    • title = {Robust Attentional Pooling via Feature Selection},
    • booktitle = {IEEE International Conference on Pattern Recognition (ICPR)},
    • year = 2018,
    • pages = {2038--2043},
    • month = aug,
    • doi = {10.1109/ICPR.2018.8545607},
    • url = {https://www.merl.com/publications/TR2018-124}
    • }
  •  Seki, H., Hori, T., Watanabe, S., Le Roux, J., Hershey, J., "A Purely End-to-end System for Multi-speaker Speech Recognition", Annual Meeting of the Association for Computational Linguistics (ACL), July 2018, pp. 2620-2630.
    BibTeX TR2018-104 PDF Video
    • @inproceedings{Seki2018jul,
    • author = {Seki, Hiroshi and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan and Hershey, John},
    • title = {A Purely End-to-end System for Multi-speaker Speech Recognition},
    • booktitle = {Annual Meeting of the Association for Computational Linguistics (ACL)},
    • year = 2018,
    • pages = {2620--2630},
    • month = jul,
    • publisher = {Association for Computational Linguistics},
    • url = {https://www.merl.com/publications/TR2018-104}
    • }
  •  Alamri, H., Cartillier, V., Lopes, R., Das, A., Wang, J., Essa, I., Batra, D., Parikh, D., Cherian, A., Marks, T.K., Hori, C., "Audio Visual Scene-Aware Dialog (AVSD) Challenge at DSTC7", arXiv, July 12, 2018.
    BibTeX arXiv
    • @article{Alamri2018jul,
    • author = {Alamri, Huda and Cartillier, Vincent and Lopes, Raphael and Das, Abhishek and Wang, Jue and Essa, Irfan and Batra, Dhruv and Parikh, Devi and Cherian, Anoop and Marks, Tim K. and Hori, Chiori},
    • title = {Audio Visual Scene-Aware Dialog (AVSD) Challenge at DSTC7},
    • journal = {arXiv},
    • year = 2018,
    • month = jul,
    • url = {https://arxiv.org/abs/1806.00525}
    • }
  •  Zhang, Z., "LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks", arXiv, July 12, 2018.
    BibTeX arXiv
    • @article{Zhang2018jul,
    • author = {Zhang, Ziming},
    • title = {LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks},
    • journal = {arXiv},
    • year = 2018,
    • month = jul,
    • url = {https://arxiv.org/abs/1805.08656}
    • }
  •  Zhang, Z., Lin, R., Sullivan, A., "Deformable Part Networks", arXiv, July 12, 2018.
    BibTeX arXiv
    • @article{Zhang2018jul2,
    • author = {Zhang, Ziming and Lin, Rongmei and Sullivan, Alan},
    • title = {Deformable Part Networks},
    • journal = {arXiv},
    • year = 2018,
    • month = jul,
    • url = {https://arxiv.org/abs/1805.08808}
    • }
  •  Sanz, I., Bernal, C., Bono, A., Pajovic, M., Martinez, G., "Gaussian Process Regression Applied to VRLA Battery Voltage Prediction in Photovoltaic Off-Grid Systems", Jornada de Jovenes Investigadores, July 11, 2018.
    BibTeX TR2018-077 PDF
    • @inproceedings{Sanz2018jul,
    • author = {Sanz, Ivan and Bernal, Carlos and Bono, Antonio and Pajovic, Milutin and Martinez, Gabriel},
    • title = {Gaussian Process Regression Applied to VRLA Battery Voltage Prediction in Photovoltaic Off-Grid Systems},
    • booktitle = {Jornada de Jovenes Investigadores},
    • year = 2018,
    • number = 6,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2018-077}
    • }
  •  Pan, Y., Farahmand, A.-M., White, M., Nabi, S., Grover, P., Nikovski, D.N., "Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control", International Conference on Machine Learning (ICML), July 2018.
    BibTeX TR2018-101 PDF
    • @inproceedings{Pan2018jul,
    • author = {Pan, Yangchen and Farahmand, Amir-massoud and White, Martha and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
    • title = {Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2018,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2018-101}
    • }
  •  Liu, J., Guo, J., Orlik, P.V., Shibata, M., Nakahara, D., Mii, S., Takac, M., "Anomaly Detection in Manufacturing Systems Using Structured Neural Networks", IEEE World Congress on Intelligent Control and Automation, DOI: 10.1109/WCICA.2018.8630692, July 2018, pp. 175-180.
    BibTeX TR2018-097 PDF
    • @inproceedings{Liu2018jul2,
    • author = {Liu, Jie and Guo, Jianlin and Orlik, Philip V. and Shibata, Masahiko and Nakahara, Daiki and Mii, Satoshi and Takac, Martin},
    • title = {Anomaly Detection in Manufacturing Systems Using Structured Neural Networks},
    • booktitle = {IEEE World Congress on Intelligent Control and Automation},
    • year = 2018,
    • pages = {175--180},
    • month = jul,
    • doi = {10.1109/WCICA.2018.8630692},
    • url = {https://www.merl.com/publications/TR2018-097}
    • }
  •  Shen, Y., Feng, C., Yang, Y., Tian, D., "Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018.
    BibTeX TR2018-041 PDF Software
    • @inproceedings{Shen2018jun,
    • author = {Shen, Yiru and Feng, Chen and Yang, Yaoqing and Tian, Dong},
    • title = {Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2018,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2018-041}
    • }
  •  Yang, Y., Feng, C., Shen, Y., Tian, D., "FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2018.00029, June 2018.
    BibTeX TR2018-042 PDF Software
    • @inproceedings{Yang2018jun,
    • author = {Yang, Yaoqing and Feng, Chen and Shen, Yiru and Tian, Dong},
    • title = {FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2018,
    • month = jun,
    • doi = {10.1109/CVPR.2018.00029},
    • url = {https://www.merl.com/publications/TR2018-042}
    • }
  •  Zhang, Z., Wu, Y., Wang, G., "BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018, pp. 3301-3309.
    BibTeX TR2018-068 PDF
    • @inproceedings{Zhang2018jun,
    • author = {Zhang, Ziming and Wu, Yuanwei and Wang, Guanghui},
    • title = {BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2018,
    • pages = {3301--3309},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2018-068}
    • }
  •  Nowara, E., Marks, T.K., Mansour, H., Nakamura, Y., Veeraraghavan, A., "SparsePPG: Towards Driver Monitoring Using Camera-Based Vital Signs Estimation in Near-Infrared", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop on Computer Vision for Physiological Measurement (CVPM), June 2018, pp. 1272-1281.
    BibTeX TR2018-067 PDF
    • @inproceedings{Nowara2018jun,
    • author = {Nowara, Ewa and Marks, Tim K. and Mansour, Hassan and Nakamura, Yudai and Veeraraghavan, Ashok},
    • title = {SparsePPG: Towards Driver Monitoring Using Camera-Based Vital Signs Estimation in Near-Infrared},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop on Computer Vision for Physiological Measurement (CVPM)},
    • year = 2018,
    • pages = {1272--1281},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2018-067}
    • }
  •  Deshmukh, A., Laftchiev, E., "Semi-Supervised Transfer Learning Using Marginal Predictors", IEEE Data Science Workshop, DOI: 10.1109/DSW.2018.8439908, June 6, 2018, pp. 160-164.
    BibTeX TR2018-040 PDF Software
    • @inproceedings{Deshmukh2018jun,
    • author = {Deshmukh, Aniket and Laftchiev, Emil},
    • title = {Semi-Supervised Transfer Learning Using Marginal Predictors},
    • booktitle = {IEEE Data Science Workshop},
    • year = 2018,
    • pages = {160--164},
    • month = jun,
    • doi = {10.1109/DSW.2018.8439908},
    • url = {https://www.merl.com/publications/TR2018-040}
    • }
  •  Ochiai, T., Watanabe, S., Katagiri, S., Hori, T., Hershey, J.R., "Speaker Adaptation for Multichannel End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462161, April 2018, pp. 6707-6711.
    BibTeX TR2018-006 PDF
    • @inproceedings{Ochiai2018apr,
    • author = {Ochiai, Tsubasa and Watanabe, Shinji and Katagiri, Shigeru and Hori, Takaaki and Hershey, John R.},
    • title = {Speaker Adaptation for Multichannel End-to-End Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2018,
    • pages = {6707--6711},
    • month = apr,
    • doi = {10.1109/ICASSP.2018.8462161},
    • url = {https://www.merl.com/publications/TR2018-006}
    • }
  •  Seki, H., Watanabe, S., Hori, T., Le Roux, J., Hershey, J.R., "An End-to-End Language-Tracking Speech Recognizer for Mixed-Language Speech", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462180, April 2018, pp. 4919-4923.
    BibTeX TR2018-002 PDF Video
    • @inproceedings{Seki2018apr,
    • author = {Seki, Hiroshi and Watanabe, Shinji and Hori, Takaaki and Le Roux, Jonathan and Hershey, John R.},
    • title = {An End-to-End Language-Tracking Speech Recognizer for Mixed-Language Speech},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2018,
    • pages = {4919--4923},
    • month = apr,
    • doi = {10.1109/ICASSP.2018.8462180},
    • url = {https://www.merl.com/publications/TR2018-002}
    • }