Publications

128 / 3,208 publications found.


  •  Seetharaman, P., Wichern, G., Venkataramani, S., Le Roux, J., "Class-Conditional Embeddings for Music Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683007, May 2019.
    BibTeX TR2019-004 PDF
    • @inproceedings{Seetharaman2019may,
    •   author    = {Seetharaman, Prem and Wichern, Gordon and Venkataramani, Shrikant and Le Roux, Jonathan},
    •   title     = {Class-Conditional Embeddings for Music Source Separation},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   month     = may,
    •   year      = {2019},
    •   doi       = {10.1109/ICASSP.2019.8683007},
    •   url       = {https://www.merl.com/publications/TR2019-004}
    • }
  •  Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Adversarial Deep Learning in EEG Biometrics", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2019.2906826, Vol. 26, No. 5, pp. 710-714, March 2019.
    BibTeX TR2019-017 PDF
    • @article{Ozdenizci2019mar2,
    •   author  = {Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    •   title   = {Adversarial Deep Learning in {EEG} Biometrics},
    •   journal = {IEEE Signal Processing Letters},
    •   volume  = {26},
    •   number  = {5},
    •   pages   = {710--714},
    •   month   = mar,
    •   year    = {2019},
    •   doi     = {10.1109/LSP.2019.2906826},
    •   url     = {https://www.merl.com/publications/TR2019-017}
    • }
  •  Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "Phasebook and Friends: Leveraging discrete representations for source separation", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2019.2904183, Vol. 13, No. 2, pp. 370-382, March 2019.
    BibTeX TR2018-199 PDF
    • @article{LeRoux2019mar,
    •   author  = {Le Roux, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
    •   title   = {Phasebook and Friends: Leveraging discrete representations for source separation},
    •   journal = {IEEE Journal of Selected Topics in Signal Processing},
    •   volume  = {13},
    •   number  = {2},
    •   pages   = {370--382},
    •   month   = mar,
    •   year    = {2019},
    •   doi     = {10.1109/JSTSP.2019.2904183},
    •   url     = {https://www.merl.com/publications/TR2018-199}
    • }
  •  TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Design of Integrated Photonic Power Splitters", Nature Scientific Reports, DOI: 10.1038/s41598-018-37952-2, Vol. 9, pp. 1368, December 2018.
    BibTeX TR2018-180 PDF
    • @article{TaherSima2018dec,
    •   author  = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
    •   title   = {Deep Neural Network Inverse Design of Integrated Photonic Power Splitters},
    •   journal = {Nature Scientific Reports},
    •   volume  = {9},
    •   pages   = {1368},
    •   month   = dec,
    •   year    = {2018},
    •   doi     = {10.1038/s41598-018-37952-2},
    •   issn    = {2045-2322},
    •   url     = {https://www.merl.com/publications/TR2018-180}
    • }
  •  Paul, S., van Baar, J., "Trajectory-based Learning for Ball-in-Maze Games", NIPS Workshop on Imitation Learning and its Challenges in Robotics, December 2018.
    BibTeX TR2018-158 PDF
    • @inproceedings{Paul2018dec,
    •   author    = {Paul, Sujoy and van Baar, Jeroen},
    •   title     = {Trajectory-based Learning for Ball-in-Maze Games},
    •   booktitle = {NIPS Workshop on Imitation Learning and its Challenges in Robotics},
    •   month     = dec,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-158}
    • }
  •  Jha, D.K., Romeres, D., van Baar, J., Sullivan, A., Nikovski, D.N., "Learning Tasks in a Complex Circular Maze Environment", NIPS Workshop on Modeling the Physical World: Perception, Learning, and Control, December 2018.
    BibTeX TR2018-169 PDF
    • @inproceedings{vanBaar2018dec,
    •   author    = {Jha, Devesh K. and Romeres, Diego and van Baar, Jeroen and Sullivan, Alan and Nikovski, Daniel N.},
    •   title     = {Learning Tasks in a Complex Circular Maze Environment},
    •   booktitle = {NIPS Workshop on Modeling the Physical World: Perception, Learning, and Control},
    •   month     = dec,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-169}
    • }
  •  Wichern, G., Le Roux, J., "Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/IWAENC.2018.8521243, September 2018.
    BibTeX TR2018-146 PDF
    • @inproceedings{Wichern2018sep,
    •   author    = {Wichern, Gordon and Le Roux, Jonathan},
    •   title     = {Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation},
    •   booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
    •   month     = sep,
    •   year      = {2018},
    •   doi       = {10.1109/IWAENC.2018.8521243},
    •   url       = {https://www.merl.com/publications/TR2018-146}
    • }
  •  Wang, J., Cherian, A., "Learning Discriminative Video Representations Using Adversarial Perturbations", European Conference on Computer Vision (ECCV), September 2018.
    BibTeX TR2018-139 PDF Software
    • @inproceedings{Wang2018sep3,
    •   author    = {Wang, Jue and Cherian, Anoop},
    •   title     = {Learning Discriminative Video Representations Using Adversarial Perturbations},
    •   booktitle = {European Conference on Computer Vision (ECCV)},
    •   month     = sep,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-139}
    • }
  •  Kocanaogullari, A., Ataer-Cansizoglu, E., "Active Descriptor Learning for Feature Matching", International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision, September 2018.
    BibTeX TR2018-132 PDF
    • @inproceedings{Kocanaogullari2018sep,
    •   author    = {Kocanaogullari, Aziz and Ataer-Cansizoglu, Esra},
    •   title     = {Active Descriptor Learning for Feature Matching},
    •   booktitle = {International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision},
    •   month     = sep,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-132}
    • }
  •  Wang, Z.-Q., Le Roux, J., Wang, D., Hershey, J., "End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction", Interspeech, September 2018.
    BibTeX TR2018-135 PDF
    • @inproceedings{Wang2018sep,
    •   author    = {Wang, Zhong-Qiu and Le Roux, Jonathan and Wang, DeLiang and Hershey, John},
    •   title     = {End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction},
    •   booktitle = {Interspeech},
    •   month     = sep,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-135}
    • }
  •  Watanabe, S., Hori, T., Karita, S., Hayashi, T., Nishitoba, J., Unno, Y., Enrique Yalta Soplin, N., Heymann, J., Wiesner, M., Chen, N., Renduchintala, A., Ochiai, T., "ESPnet: End-to-End Speech Processing Toolkit", Interspeech, September 2018.
    BibTeX TR2018-136 PDF
    • @inproceedings{Watanabe2018sep,
    •   author    = {Watanabe, Shinji and Hori, Takaaki and Karita, Shigeki and Hayashi, Tomoki and Nishitoba, Jiro and Unno, Yuya and Enrique Yalta Soplin, Nelson and Heymann, Jahn and Wiesner, Matthew and Chen, Nanxin and Renduchintala, Adithya and Ochiai, Tsubasa},
    •   title     = {{ESPnet}: End-to-End Speech Processing Toolkit},
    •   booktitle = {Interspeech},
    •   month     = sep,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-136}
    • }
  •  Ataer-Cansizoglu, E., Jones, M.J., Zhang, Z., Sullivan, A., "Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network", arXiv, August 2018.
    BibTeX arXiv
    • @article{Ataer-Cansizoglu2018aug,
    •   author        = {Ataer-Cansizoglu, Esra and Jones, Michael J. and Zhang, Ziming and Sullivan, Alan},
    •   title         = {Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network},
    •   journal       = {arXiv},
    •   month         = aug,
    •   year          = {2018},
    •   eprint        = {1903.10974},
    •   archiveprefix = {arXiv},
    •   url           = {https://arxiv.org/abs/1903.10974}
    • }
  •  Zhang, Z., "LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks", arXiv, July 12, 2018.
    BibTeX arXiv
    • @article{Zhang2018jul,
    •   author        = {Zhang, Ziming},
    •   title         = {{LMKL-Net}: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks},
    •   journal       = {arXiv},
    •   month         = jul,
    •   year          = {2018},
    •   eprint        = {1805.08656},
    •   archiveprefix = {arXiv},
    •   url           = {https://arxiv.org/abs/1805.08656}
    • }
  •  Pan, Y., Farahmand, A.-M., White, M., Nabi, S., Grover, P., Nikovski, D.N., "Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control", International Conference on Machine Learning (ICML), July 2018.
    BibTeX TR2018-101 PDF
    • @inproceedings{Pan2018jul,
    •   author    = {Pan, Yangchen and Farahmand, Amir-massoud and White, Martha and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
    •   title     = {Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control},
    •   booktitle = {International Conference on Machine Learning (ICML)},
    •   month     = jul,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-101}
    • }
  •  Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The CHiME challenges: Robust speech recognition in everyday environments" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 14, Springer, July 2018.
    BibTeX
    • @incollection{Barker2018jul,
    •   author    = {Barker, Jon and Marxer, Ricard and Vincent, Emmanuel and Watanabe, Shinji},
    •   title     = {The {CHiME} challenges: Robust speech recognition in everyday environments},
    •   booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    •   editor    = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
    •   chapter   = {14},
    •   publisher = {Springer},
    •   month     = jul,
    •   year      = {2018},
    •   isbn      = {978-3-319-64680-0}
    • }
  •  Erdogan, H., Hershey, J., Watanabe, S., Le Roux, J., "Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 7, Springer, July 2018.
    BibTeX
    • @incollection{Erdogan2018jul,
    •   author    = {Erdogan, Hakan and Hershey, John and Watanabe, Shinji and Le Roux, Jonathan},
    •   title     = {Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio},
    •   booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    •   editor    = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
    •   chapter   = {7},
    •   publisher = {Springer},
    •   month     = jul,
    •   year      = {2018},
    •   isbn      = {978-3-319-64680-0}
    • }
  •  Hershey, J., Le Roux, J., Watanabe, S., Wisdom, S., Chen, Z., Isik, Y., "Novel deep architectures in speech processing" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 6, Springer, July 9, 2018.
    BibTeX
    • @incollection{Hershey2018jul,
    •   author    = {Hershey, John and Le Roux, Jonathan and Watanabe, Shinji and Wisdom, Scott and Chen, Zhuo and Isik, Yusuf},
    •   title     = {Novel deep architectures in speech processing},
    •   booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    •   editor    = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
    •   chapter   = {6},
    •   publisher = {Springer},
    •   month     = jul,
    •   year      = {2018},
    •   isbn      = {978-3-319-64680-0}
    • }
  •  Karafiat, M., Vesely, K., Zmolikova, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J., Szoke, I., Novotny, O., "Training data augmentation and data selection" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 10, Springer, July 9, 2018.
    BibTeX
    • @incollection{Karafiat2018jul,
    •   author    = {Karafiat, Martin and Vesely, Karel and Zmolikova, Katerina and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan and Szoke, Igor and Novotny, Ondrej},
    •   title     = {Training data augmentation and data selection},
    •   booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    •   editor    = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
    •   chapter   = {10},
    •   publisher = {Springer},
    •   month     = jul,
    •   year      = {2018},
    •   isbn      = {978-3-319-64680-0}
    • }
  •  Watanabe, S., Hori, T., Miao, Y., Delcroix, M., Metze, F., Hershey, J., "Toolkits for robust speech processing" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 17, Springer, July 9, 2018.
    BibTeX
    • @incollection{Watanabe2018jul,
    •   author    = {Watanabe, Shinji and Hori, Takaaki and Miao, Yajie and Delcroix, Marc and Metze, Florian and Hershey, John},
    •   title     = {Toolkits for robust speech processing},
    •   booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    •   editor    = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
    •   chapter   = {17},
    •   publisher = {Springer},
    •   month     = jul,
    •   year      = {2018},
    •   isbn      = {978-3-319-64680-0}
    • }
  •  Xiao, X., Watanabe, S., Erdogan, H., Mandel, M., Lu, L., Hershey, J., Seltzer, M., Chen, G., Zhang, Y., Yu, D., "Discriminative beamforming with phase aware neural networks for speech enhancement and recognition" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., Hershey, J.R., Eds., chapter 4, Springer, July 9, 2018.
    BibTeX
    • @incollection{Xiao2018jul2,
    •   author    = {Xiao, Xiong and Watanabe, Shinji and Erdogan, Hakan and Mandel, Michael and Lu, Liang and Hershey, John and Seltzer, Mike and Chen, Guoguo and Zhang, Yu and Yu, Dong},
    •   title     = {Discriminative beamforming with phase aware neural networks for speech enhancement and recognition},
    •   booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    •   editor    = {Watanabe, Shinji and Delcroix, Marc and Metze, Florian and Hershey, John R.},
    •   chapter   = {4},
    •   publisher = {Springer},
    •   month     = jul,
    •   year      = {2018},
    •   isbn      = {978-3-319-64680-0}
    • }
  •  Liu, J., Guo, J., Orlik, P.V., Shibata, M., Nakahara, D., Mii, S., Takac, M., "Anomaly Detection in Manufacturing Systems Using Structured Neural Networks", IEEE World Congress on Intelligent Control and Automation, DOI: 10.1109/WCICA.2018.8630692, July 2018, pp. 175-180.
    BibTeX TR2018-097 PDF
    • @inproceedings{Liu2018jul2,
    •   author    = {Liu, Jie and Guo, Jianlin and Orlik, Philip V. and Shibata, Masahiko and Nakahara, Daiki and Mii, Satoshi and Takac, Martin},
    •   title     = {Anomaly Detection in Manufacturing Systems Using Structured Neural Networks},
    •   booktitle = {IEEE World Congress on Intelligent Control and Automation},
    •   pages     = {175--180},
    •   month     = jul,
    •   year      = {2018},
    •   doi       = {10.1109/WCICA.2018.8630692},
    •   url       = {https://www.merl.com/publications/TR2018-097}
    • }
  •  Koike-Akino, T., Millar, D.S., Parsons, K., Kojima, K., "Fiber Nonlinearity Equalization with Multi-Label Deep Learning Scalable to High-Order DP-QAM", Signal Processing in Photonic Communications (SPPCom), DOI: 10.1364/SPPCOM.2018.SpM4G.1, July 2018.
    BibTeX TR2018-047 PDF
    • @inproceedings{Koike-Akino2018jul3,
    •   author    = {Koike-Akino, Toshiaki and Millar, David S. and Parsons, Kieran and Kojima, Keisuke},
    •   title     = {Fiber Nonlinearity Equalization with Multi-Label Deep Learning Scalable to High-Order {DP-QAM}},
    •   booktitle = {Signal Processing in Photonic Communications (SPPCom)},
    •   month     = jul,
    •   year      = {2018},
    •   doi       = {10.1364/SPPCOM.2018.SpM4G.1},
    •   url       = {https://www.merl.com/publications/TR2018-047}
    • }
  •  Shen, Y., Feng, C., Yang, Y., Tian, D., "Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018.
    BibTeX TR2018-041 PDF Software
    • @inproceedings{Shen2018jun,
    •   author    = {Shen, Yiru and Feng, Chen and Yang, Yaoqing and Tian, Dong},
    •   title     = {Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling},
    •   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    •   month     = jun,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-041}
    • }
  •  Yang, Y., Feng, C., Shen, Y., Tian, D., "FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2018.00029, June 2018.
    BibTeX TR2018-042 PDF Software
    • @inproceedings{Yang2018jun,
    •   author    = {Yang, Yaoqing and Feng, Chen and Shen, Yiru and Tian, Dong},
    •   title     = {{FoldingNet}: Point Cloud Auto-encoder via Deep Grid Deformation},
    •   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    •   month     = jun,
    •   year      = {2018},
    •   doi       = {10.1109/CVPR.2018.00029},
    •   url       = {https://www.merl.com/publications/TR2018-042}
    • }
  •  Zhang, Z., Wu, Y., Wang, G., "BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018, pp. 3301-3309.
    BibTeX TR2018-068 PDF
    • @inproceedings{Zhang2018jun,
    •   author    = {Zhang, Ziming and Wu, Yuanwei and Wang, Guanghui},
    •   title     = {{BPGrad}: Towards Global Optimality in Deep Learning via Branch and Pruning},
    •   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    •   pages     = {3301--3309},
    •   month     = jun,
    •   year      = {2018},
    •   url       = {https://www.merl.com/publications/TR2018-068}
    • }