Publications

629 / 3,736 publications found.


  •  Aralikatti, R., Boeddeker, C., Wichern, G., Subramanian, A.S., Le Roux, J., "Reverberation as Supervision for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095022, May 2023, pp. 1-5.
    BibTeX TR2023-016 PDF
    • @inproceedings{Aralikatti2023may,
    • author = {Aralikatti, Rohith and Boeddeker, Christoph and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
    • title = {Reverberation as Supervision for Speech Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095022},
    • url = {https://www.merl.com/publications/TR2023-016}
    • }
  •  Berk, A., Ma, Y., Boufounos, P.T., Wang, P., Mansour, H., "Deep Proximal Gradient Method for Learned Convex Regularizers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10094632, May 2023, pp. 1-5.
    BibTeX TR2023-032 PDF Video
    • @inproceedings{Berk2023may,
    • author = {Berk, Aaron and Ma, Yanting and Boufounos, Petros T. and Wang, Pu and Mansour, Hassan},
    • title = {Deep Proximal Gradient Method for Learned Convex Regularizers},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10094632},
    • isbn = {978-1-7281-6327-7},
    • url = {https://www.merl.com/publications/TR2023-032}
    • }
  •  Bralios, D., Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Latent Iterative Refinement for Modular Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096897, May 2023, pp. 1-5.
    BibTeX TR2023-019 PDF
    • @inproceedings{Bralios2023may,
    • author = {Bralios, Dimitrios and Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and Le Roux, Jonathan},
    • title = {Latent Iterative Refinement for Modular Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10096897},
    • url = {https://www.merl.com/publications/TR2023-019}
    • }
  •  Fujihashi, T., Koike-Akino, T., Watanabe, T., "Soft 2D-to-3D Delivery Using Deep Graph Neural Networks for Holographic-Type Communication", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095882, May 2023.
    BibTeX TR2023-031 PDF
    • @inproceedings{Fujihashi2023may,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi},
    • title = {Soft 2D-to-3D Delivery Using Deep Graph Neural Networks for Holographic-Type Communication},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095882},
    • isbn = {978-1-7281-6327-7},
    • url = {https://www.merl.com/publications/TR2023-031}
    • }
  •  Petermann, D., Wichern, G., Subramanian, A.S., Le Roux, J., "Hyperbolic Audio Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10094943, May 2023, pp. 1-5.
    BibTeX TR2023-017 PDF Video Software
    • @inproceedings{Petermann2023may,
    • author = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
    • title = {Hyperbolic Audio Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10094943},
    • url = {https://www.merl.com/publications/TR2023-017}
    • }
  •  Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Optimal Condition Training for Target Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095128, May 2023, pp. 1-5.
    BibTeX TR2023-018 PDF
    • @inproceedings{Tzinis2023may,
    • author = {Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and Le Roux, Jonathan},
    • title = {Optimal Condition Training for Target Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095128},
    • url = {https://www.merl.com/publications/TR2023-018}
    • }
  •  Vaca-Rubio, C., Wang, P., Koike-Akino, T., Wang, Y., Boufounos, P.T., Popovski, P., "mmWave Wi-Fi Trajectory Estimation with Continuous-Time Neural Dynamic Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096474, May 2023, pp. 1-5.
    BibTeX TR2023-033 PDF Video
    • @inproceedings{Vaca-Rubio2023may,
    • author = {Vaca-Rubio, Cristian and Wang, Pu and Koike-Akino, Toshiaki and Wang, Ye and Boufounos, Petros T. and Popovski, Petar},
    • title = {mmWave Wi-Fi Trajectory Estimation with Continuous-Time Neural Dynamic Learning},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10096474},
    • isbn = {978-1-7281-6327-7},
    • url = {https://www.merl.com/publications/TR2023-033}
    • }
  •  Yen, H., Germain, F., Wichern, G., Le Roux, J., "Cold Diffusion for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096064, May 2023, pp. 1-5.
    BibTeX TR2023-020 PDF
    • @inproceedings{Yen2023may,
    • author = {Yen, Hao and Germain, Francois and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Cold Diffusion for Speech Enhancement},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10096064},
    • url = {https://www.merl.com/publications/TR2023-020}
    • }
  •  Zhao, Q., Ma, Y., Boufounos, P.T., Nabi, S., Mansour, H., "Deep Born Operator Learning for Reflection Tomographic Imaging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095494, May 2023, pp. 1-5.
    BibTeX TR2023-029 PDF Video
    • @inproceedings{Zhao2023may,
    • author = {Zhao, Qingqing and Ma, Yanting and Boufounos, Petros T. and Nabi, Saleh and Mansour, Hassan},
    • title = {Deep Born Operator Learning for Reflection Tomographic Imaging},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • pages = {1--5},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10095494},
    • url = {https://www.merl.com/publications/TR2023-029}
    • }
  •  Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
    BibTeX TR2023-014 PDF Video Data Software Presentation
    • @inproceedings{Cherian2023mar,
    • author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
    • title = {Are Deep Neural Networks SMARTer than Second Graders?},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2023,
    • pages = {10834--10844},
    • month = mar,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2023-014}
    • }
  •  Kojima, K., Koike-Akino, T., Wang, Y., Jung, M., Brand, M., "Inverse design of two-dimensional freeform metagrating using an adversarial conditional variational autoencoder", SPIE Photonics West, DOI: 10.1117/12.2650299, January 2023.
    BibTeX TR2023-004 PDF
    • @inproceedings{Kojima2023jan,
    • author = {Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Jung, Minwoo and Brand, Matthew},
    • title = {Inverse design of two-dimensional freeform metagrating using an adversarial conditional variational autoencoder},
    • booktitle = {Proc. SPIE 12431, Photonic and Phononic Properties of Engineered Nanostructures XIII},
    • year = 2023,
    • month = jan,
    • publisher = {SPIE},
    • doi = {10.1117/12.2650299},
    • url = {https://www.merl.com/publications/TR2023-004}
    • }
  •  Liu, T., Cherian, A., "Learning a Constrained Optimizer: A Primal Method", AAAI Bridge on Constraint Programming and Machine Learning, January 2023.
    BibTeX TR2023-003 PDF
    • @inproceedings{Liu2023jan,
    • author = {Liu, Tao and Cherian, Anoop},
    • title = {Learning a Constrained Optimizer: A Primal Method},
    • booktitle = {AAAI Bridge on Constraint Programming and Machine Learning},
    • year = 2023,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2023-003}
    • }
  •  Tohme, T., Liu, D., Youcef-Toumi, K., "GSR: A Generalized Symbolic Regression Approach", Transactions on Machine Learning Research, January 2023.
    BibTeX TR2023-002 PDF
    • @article{Tohme2023jan,
    • author = {Tohme, Tony and Liu, Dehong and Youcef-Toumi, Kamal},
    • title = {GSR: A Generalized Symbolic Regression Approach},
    • journal = {Transactions on Machine Learning Research},
    • year = 2023,
    • month = jan,
    • issn = {2835-8856},
    • url = {https://www.merl.com/publications/TR2023-002}
    • }
  •  Wang, Z.-Q., Wichern, G., Watanabe, S., Le Roux, J., "STFT-Domain Neural Speech Enhancement with Very Low Algorithmic Latency", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2022.3224285, Vol. 31, pp. 397-410, December 2022.
    BibTeX TR2022-166 PDF
    • @article{Wang2022dec2,
    • author = {Wang, Zhong-Qiu and Wichern, Gordon and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {STFT-Domain Neural Speech Enhancement with Very Low Algorithmic Latency},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2022,
    • volume = 31,
    • pages = {397--410},
    • month = dec,
    • doi = {10.1109/TASLP.2022.3224285},
    • issn = {2329-9304},
    • url = {https://www.merl.com/publications/TR2022-166}
    • }
  •  Singla, V., Aeron, S., Koike-Akino, T., Parsons, K., Brand, M., Wang, Y., "Learning with noisy labels using low-dimensional model trajectory", NeurIPS 2022 Workshop on Distribution Shifts (DistShift), December 2022.
    BibTeX TR2022-156 PDF
    • @inproceedings{Singla2022dec,
    • author = {Singla, Vasu and Aeron, Shuchin and Koike-Akino, Toshiaki and Parsons, Kieran and Brand, Matthew and Wang, Ye},
    • title = {Learning with noisy labels using low-dimensional model trajectory},
    • booktitle = {NeurIPS 2022 Workshop on Distribution Shifts: Connecting Methods and Applications},
    • year = 2022,
    • month = dec,
    • publisher = {OpenReview},
    • url = {https://www.merl.com/publications/TR2022-156}
    • }
  •  Shimoya, R., Morimoto, T., van Baar, J., Boufounos, P.T., Ma, Y., Mansour, H., "Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images", IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), DOI: 10.1109/​AVSS56176.2022.9959354, November 2022, pp. 1-8.
    BibTeX TR2022-149 PDF
    • @inproceedings{Shimoya2022nov,
    • author = {Shimoya, Ryosuke and Morimoto, Takashi and van Baar, Jeroen and Boufounos, Petros T. and Ma, Yanting and Mansour, Hassan},
    • title = {Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images},
    • booktitle = {IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS)},
    • year = 2022,
    • pages = {1--8},
    • month = nov,
    • doi = {10.1109/AVSS56176.2022.9959354},
    • isbn = {978-1-6654-6382-9},
    • url = {https://www.merl.com/publications/TR2022-149}
    • }
  •  Romero, D., Lohit, S., "Learning Partial Equivariances from Data", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 36466-36478.
    BibTeX TR2022-148 PDF Software Presentation
    • @inproceedings{Romero2022nov,
    • author = {Romero, David and Lohit, Suhas},
    • title = {Learning Partial Equivariances from Data},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2022,
    • editor = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
    • pages = {36466--36478},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2022-148}
    • }
  •  Wang, H., Lohit, S., Jones, M.J., Fu, R., "What Makes a “Good” Data Augmentation in Knowledge Distillation – A Statistical Perspective", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 13456-13469.
    BibTeX TR2022-147 PDF
    • @inproceedings{Wang2022nov,
    • author = {Wang, Huan and Lohit, Suhas and Jones, Michael J. and Fu, Raymond},
    • title = {What Makes a {``Good''} Data Augmentation in Knowledge Distillation -- A Statistical Perspective},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2022,
    • editor = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
    • pages = {13456--13469},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2022-147}
    • }
  •  Venkatesh, S., Wichern, G., Subramanian, A.S., Le Roux, J., "Improved Domain Generalization via Disentangled Multi-Task Learning in Unsupervised Anomalous Sound Detection", DCASE Workshop, Lagrange, M. and Mesaros, A. and Pellegrini, T. and Richard, G. and Serizel, R. and Stowell, D., Eds., November 2022.
    BibTeX TR2022-146 PDF Presentation
    • @inproceedings{Venkatesh2022nov,
    • author = {Venkatesh, Satvik and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
    • title = {Improved Domain Generalization via Disentangled Multi-Task Learning in Unsupervised Anomalous Sound Detection},
    • booktitle = {DCASE Workshop},
    • year = 2022,
    • editor = {Lagrange, M. and Mesaros, A. and Pellegrini, T. and Richard, G. and Serizel, R. and Stowell, D.},
    • month = nov,
    • isbn = {978-952-03-2677-7},
    • url = {https://www.merl.com/publications/TR2022-146}
    • }
  •  Yu, X., Smedemark-Margulies, N., Aeron, S., Koike-Akino, T., Moulin, P., Brand, M., Parsons, K., Wang, Y., "Improving Adversarial Robustness by Learning Shared Information", Pattern Recognition, DOI: 10.1016/​j.patcog.2022.109054, Vol. 134, pp. 109054, November 2022.
    BibTeX TR2022-141 PDF
    • @article{Yu2022nov,
    • author = {Yu, Xi and Smedemark-Margulies, Niklas and Aeron, Shuchin and Koike-Akino, Toshiaki and Moulin, Pierre and Brand, Matthew and Parsons, Kieran and Wang, Ye},
    • title = {Improving Adversarial Robustness by Learning Shared Information},
    • journal = {Pattern Recognition},
    • year = 2022,
    • volume = 134,
    • pages = 109054,
    • month = nov,
    • doi = {10.1016/j.patcog.2022.109054},
    • issn = {0031-3203},
    • url = {https://www.merl.com/publications/TR2022-141}
    • }
  •  Ahmed, S.M., Lohit, S., Peng, K.-C., Jones, M.J., Roy Chowdhury, A.K., "Cross-Modal Knowledge Transfer Without Task-Relevant Source Data", European Conference on Computer Vision (ECCV), Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G.M. and Hassner, T., Eds., DOI: 10.1007/978-3-031-19830-4_7, October 2022, pp. 111-127.
    BibTeX TR2022-135 PDF Video Software Presentation
    • @inproceedings{Ahmed2022oct,
    • author = {Ahmed, Sk Miraj and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Roy Chowdhury, Amit K.},
    • title = {Cross-Modal Knowledge Transfer Without Task-Relevant Source Data},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2022,
    • editor = {Avidan, S. and Brostow, G. and Cisse, M. and Farinella, G.M. and Hassner, T.},
    • pages = {111--127},
    • month = oct,
    • publisher = {Springer},
    • doi = {10.1007/978-3-031-19830-4_7},
    • isbn = {978-3-031-19830-4},
    • url = {https://www.merl.com/publications/TR2022-135}
    • }
  •  Xia, H., Wang, P., Ding, Z., "Incomplete Multi-view Domain Adaptation via Channel Enhancement and Knowledge Transfer", European Conference on Computer Vision (ECCV), DOI: 10.1007/​978-3-031-19830-4_12, October 2022.
    BibTeX TR2022-134 PDF
    • @inproceedings{Xia2022oct,
    • author = {Xia, Haifeng and Wang, Pu and Ding, Zhengming},
    • title = {Incomplete Multi-view Domain Adaptation via Channel Enhancement and Knowledge Transfer},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2022,
    • month = oct,
    • doi = {10.1007/978-3-031-19830-4_12},
    • isbn = {978-3-031-19830-4},
    • url = {https://www.merl.com/publications/TR2022-134}
    • }
  •  Leu, J., Wang, Y., Tomizuka, M., Di Cairano, S., "Improved A-Search Guided Tree for Autonomous Trailer Planning", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/​IROS47612.2022.9982121, October 2022.
    BibTeX TR2022-133 PDF
    • @inproceedings{Leu2022oct,
    • author = {Leu, Jessica and Wang, Yebin and Tomizuka, Masayoshi and Di Cairano, Stefano},
    • title = {Improved A-Search Guided Tree for Autonomous Trailer Planning},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2022,
    • month = oct,
    • doi = {10.1109/IROS47612.2022.9982121},
    • url = {https://www.merl.com/publications/TR2022-133}
    • }
  •  Paul, S., Roy Chowdhury, A.K., Cherian, A., "AVLEN: Audio-Visual-Language Embodied Navigation in 3D Environments", Advances in Neural Information Processing Systems (NeurIPS), October 2022, pp. 6236-6249.
    BibTeX TR2022-131 PDF Video Data Software
    • @inproceedings{Paul2022oct2,
    • author = {Paul, Sudipta and Roy Chowdhury, Amit K. and Cherian, Anoop},
    • title = {AVLEN: Audio-Visual-Language Embodied Navigation in 3D Environments},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2022,
    • pages = {6236--6249},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2022-131}
    • }
  •  Mansour, H., Lohit, S., Boufounos, P.T., "Distributed Radar Autofocus Imaging Using Deep Priors", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/​ICIP46576.2022.9897332, October 2022, pp. 2511-2515.
    BibTeX TR2022-129 PDF Video
    • @inproceedings{Mansour2022oct,
    • author = {Mansour, Hassan and Lohit, Suhas and Boufounos, Petros T.},
    • title = {Distributed Radar Autofocus Imaging Using Deep Priors},
    • booktitle = {IEEE International Conference on Image Processing (ICIP)},
    • year = 2022,
    • pages = {2511--2515},
    • month = oct,
    • doi = {10.1109/ICIP46576.2022.9897332},
    • url = {https://www.merl.com/publications/TR2022-129}
    • }