Julius Richter
- Email:
-
Position:
Research / Technical Staff
Visiting Research Scientist -
Education:
Ph.D. in Computer Science, University of Hamburg, Germany, 2025 -
Research Area:
External Links:
Julius' Quick Links
-
Biography
Julius's research interests include generative models and multimodal learning for audio-visual understanding and restoration. During his Ph.D., he developed novel diffusion-based generative approaches for single-channel speech enhancement. Prior to joining MERL, he was a postdoctoral researcher at Meta Superintelligence Labs.
-
Other Publications
- Richter, J., de Oliveira, D., Gerkmann, T., "EDM2SE: A Magnitude-Preserving Network Architecture for Diffusion-Based Speech Enhancement", Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2026. BibTeX
% Conference paper: ICASSP 2026.
@Inproceedings{Richter2026ICASSPEDM2SE,
  author    = {Richter, Julius and de Oliveira, Danilo and Gerkmann, Timo},
  title     = {{EDM2SE}: A Magnitude-Preserving Network Architecture for Diffusion-Based Speech Enhancement},
  booktitle = {Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = {2026},
}
- Lemercier, J.-M., Richter, J., Welker, S., Moliner, E., Välimäki, V., Gerkmann, T., "Diffusion Models for Audio Restoration", IEEE Signal Processing Magazine, Vol. 41, No. 6, pp. 72-84, 2025. BibTeX
% Journal article: IEEE Signal Processing Magazine, volume 41, number 6, 2025.
@Article{Lemercier2025SPMDiffusion,
  author  = {Lemercier, Jean-Marie and Richter, Julius and Welker, Simon and Moliner, Eloi and V{\"a}lim{\"a}ki, Vesa and Gerkmann, Timo},
  title   = {Diffusion Models for Audio Restoration},
  journal = {IEEE Signal Processing Magazine},
  year    = {2025},
  volume  = {41},
  number  = {6},
  pages   = {72--84},
}
- Richter, J., de Oliveira, D., Gerkmann, T., "Investigating Training Objectives for Generative Speech Enhancement", Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2025. BibTeX
% Conference paper: ICASSP 2025.
@Inproceedings{Richter2025ICASSPObjectives,
  author    = {Richter, Julius and de Oliveira, Danilo and Gerkmann, Timo},
  title     = {Investigating Training Objectives for Generative Speech Enhancement},
  booktitle = {Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = {2025},
}
- Richter, J., Svajda, T., Gerkmann, T., "ReverbFX: A Dataset of Room Impulse Responses Derived from Reverb Effect Plugins for Singing Voice Dereverberation", Proceedings of the ITG Conference on Speech Communication, 2025. BibTeX
% Conference paper: ITG Conference on Speech Communication, 2025.
@Inproceedings{Richter2025ITGReverbFX,
  author    = {Richter, Julius and Svajda, Till and Gerkmann, Timo},
  title     = {{ReverbFX}: A Dataset of Room Impulse Responses Derived from Reverb Effect Plugins for Singing Voice Dereverberation},
  booktitle = {Proceedings of the ITG Conference on Speech Communication},
  year      = {2025},
}
- de Oliveira, D., Richter, J., Lemercier, J.-M., Welker, S., Gerkmann, T., "Non-intrusive Speech Quality Assessment with Diffusion Models Trained on Clean Speech", Proceedings of Interspeech, 2025. BibTeX
% Conference paper: Interspeech 2025.
@Inproceedings{deOliveira2025InterspeechLikelihood,
  author    = {de Oliveira, Danilo and Richter, Julius and Lemercier, Jean-Marie and Welker, Simon and Gerkmann, Timo},
  title     = {Non-intrusive Speech Quality Assessment with Diffusion Models Trained on Clean Speech},
  booktitle = {Proceedings of Interspeech},
  year      = {2025},
}
- Lay, B., Lemercier, J.-M., Richter, J., Gerkmann, T., "Single and Few-step Diffusion for Generative Speech Enhancement", Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2024. BibTeX
% Conference paper: ICASSP 2024.
@Inproceedings{Lay2024ICASSPFewStep,
  author    = {Lay, Bunlong and Lemercier, Jean-Marie and Richter, Julius and Gerkmann, Timo},
  title     = {Single and Few-step Diffusion for Generative Speech Enhancement},
  booktitle = {Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = {2024},
}
- Richter, J., Wu, Y.-C., Krenn, S., Welker, S., Lay, B., Watanabe, S., Richard, A., Gerkmann, T., "EARS: An Anechoic Fullband Speech Dataset Benchmarked for Speech Enhancement and Dereverberation", Proceedings of Interspeech, 2024. BibTeX
% Conference paper: Interspeech 2024.
@Inproceedings{Richter2024InterspeechEARS,
  author    = {Richter, Julius and Wu, Yi-Chiao and Krenn, Steven and Welker, Simon and Lay, Bunlong and Watanabe, Shinji and Richard, Alexander and Gerkmann, Timo},
  title     = {{EARS}: An Anechoic Fullband Speech Dataset Benchmarked for Speech Enhancement and Dereverberation},
  booktitle = {Proceedings of Interspeech},
  year      = {2024},
}
- Richter, J., Gerkmann, T., "Diffusion-based Speech Enhancement: Demonstration of Performance and Generalization", Audio Imagination Workshop at NeurIPS, 2024. BibTeX
% Workshop paper: Audio Imagination Workshop at NeurIPS, 2024.
@Inproceedings{Richter2024NeurIPSAudioImagination,
  author    = {Richter, Julius and Gerkmann, Timo},
  title     = {Diffusion-based Speech Enhancement: Demonstration of Performance and Generalization},
  booktitle = {Audio Imagination Workshop at NeurIPS},
  year      = {2024},
}
- Richter, J., Welker, S., Lemercier, J.-M., Lay, B., Peer, T., Gerkmann, T., "Causal Diffusion Models for Generalized Speech Enhancement", IEEE Open Journal of Signal Processing, Vol. 5, pp. 780-789, 2024. BibTeX
% Journal article: IEEE Open Journal of Signal Processing, volume 5, 2024.
@Article{Richter2024OJSPCausal,
  author  = {Richter, Julius and Welker, Simon and Lemercier, Jean-Marie and Lay, Bunlong and Peer, Tal and Gerkmann, Timo},
  title   = {Causal Diffusion Models for Generalized Speech Enhancement},
  journal = {IEEE Open Journal of Signal Processing},
  year    = {2024},
  volume  = {5},
  pages   = {780--789},
}
- Lay, B., Welker, S., Richter, J., Gerkmann, T., "Reducing the Prior Mismatch of Stochastic Differential Equations for Diffusion-based Speech Enhancement", Proceedings of Interspeech, 2023. BibTeX
% Conference paper: Interspeech 2023.
@Inproceedings{Lay2023InterspeechPriorMismatch,
  author    = {Lay, Bunlong and Welker, Simon and Richter, Julius and Gerkmann, Timo},
  title     = {Reducing the Prior Mismatch of Stochastic Differential Equations for Diffusion-based Speech Enhancement},
  booktitle = {Proceedings of Interspeech},
  year      = {2023},
}
- Lemercier, J.-M., Richter, J., Welker, S., Gerkmann, T., "StoRM: A Diffusion-based Stochastic Regeneration Model for Speech Enhancement and Dereverberation", IEEE/ACM Transactions on Audio, Speech, and Language Processing, Vol. 31, pp. 2724-2737, 2023. BibTeX
% Journal article: IEEE/ACM Transactions on Audio, Speech, and Language Processing, volume 31, 2023.
@Article{Lemercier2023TASLPStoRM,
  author  = {Lemercier, Jean-Marie and Richter, Julius and Welker, Simon and Gerkmann, Timo},
  title   = {{StoRM}: A Diffusion-based Stochastic Regeneration Model for Speech Enhancement and Dereverberation},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  year    = {2023},
  volume  = {31},
  pages   = {2724--2737},
}
- Martel, H., Richter, J., Li, K., Hu, X., Gerkmann, T., "Audio-Visual Speech Separation in Noisy Environments with a Lightweight Iterative Model", Proceedings of Interspeech, 2023. BibTeX
% Conference paper: Interspeech 2023.
@Inproceedings{Martel2023InterspeechAVSep,
  author    = {Martel, Hector and Richter, Julius and Li, Kai and Hu, Xiaolin and Gerkmann, Timo},
  title     = {Audio-Visual Speech Separation in Noisy Environments with a Lightweight Iterative Model},
  booktitle = {Proceedings of Interspeech},
  year      = {2023},
}
- Richter, J., Welker, S., Lemercier, J.-M., Lay, B., Peer, T., Gerkmann, T., "Speech Signal Improvement Using Causal Generative Diffusion Models", Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2023. BibTeX
% Conference paper: ICASSP 2023.
@Inproceedings{Richter2023ICASSPSpeechImprovement,
  author    = {Richter, Julius and Welker, Simon and Lemercier, Jean-Marie and Lay, Bunlong and Peer, Tal and Gerkmann, Timo},
  title     = {Speech Signal Improvement Using Causal Generative Diffusion Models},
  booktitle = {Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = {2023},
}
- Richter, J., Frintrop, S., Gerkmann, T., "Audio-Visual Speech Enhancement with Score-Based Generative Models", Proceedings of the ITG Conference on Speech Communication, 2023. BibTeX
% Conference paper: ITG Conference on Speech Communication, 2023.
@Inproceedings{Richter2023ITGAVScore,
  author    = {Richter, Julius and Frintrop, Simone and Gerkmann, Timo},
  title     = {Audio-Visual Speech Enhancement with Score-Based Generative Models},
  booktitle = {Proceedings of the ITG Conference on Speech Communication},
  year      = {2023},
}
- Richter, J., Welker, S., Lemercier, J.-M., Lay, B., Gerkmann, T., "Speech Enhancement and Dereverberation with Diffusion-Based Generative Models", IEEE/ACM Transactions on Audio, Speech, and Language Processing, Vol. 31, pp. 2351-2364, 2023. BibTeX
% Journal article: IEEE/ACM Transactions on Audio, Speech, and Language Processing, volume 31, 2023.
@Article{Richter2023TASLPDiffusion,
  author  = {Richter, Julius and Welker, Simon and Lemercier, Jean-Marie and Lay, Bunlong and Gerkmann, Timo},
  title   = {Speech Enhancement and Dereverberation with Diffusion-Based Generative Models},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  year    = {2023},
  volume  = {31},
  pages   = {2351--2364},
}
- de Oliveira, D., Richter, J., Lemercier, J.-M., Peer, T., Gerkmann, T., "On the Behavior of Intrusive and Non-intrusive Speech Enhancement Metrics in Predictive and Generative Settings", Proceedings of the ITG Conference on Speech Communication, 2023. BibTeX
% Conference paper: ITG Conference on Speech Communication, 2023.
@Inproceedings{deOliveira2023ITGMetrics,
  author    = {de Oliveira, Danilo and Richter, Julius and Lemercier, Jean-Marie and Peer, Tal and Gerkmann, Timo},
  title     = {On the Behavior of Intrusive and Non-intrusive Speech Enhancement Metrics in Predictive and Generative Settings},
  booktitle = {Proceedings of the ITG Conference on Speech Communication},
  year      = {2023},
}
- Richter, J., Liebold, J., Gerkmann, T., "Continuous Phoneme Recognition based on Audio-Visual Modality Fusion", Proceedings of the IEEE World Congress on Computational Intelligence, 2022. BibTeX
% Conference paper: IEEE World Congress on Computational Intelligence, 2022.
@Inproceedings{Richter2022WCCIAVPhoneme,
  author    = {Richter, Julius and Liebold, Jeanine and Gerkmann, Timo},
  title     = {Continuous Phoneme Recognition based on Audio-Visual Modality Fusion},
  booktitle = {Proceedings of the IEEE World Congress on Computational Intelligence},
  year      = {2022},
}
- Welker, S., Richter, J., Gerkmann, T., "Speech Enhancement with Score-Based Generative Models in the Complex STFT Domain", Proceedings of Interspeech, 2022. BibTeX
% Conference paper: Interspeech 2022.
@Inproceedings{Welker2022InterspeechComplex,
  author    = {Welker, Simon and Richter, Julius and Gerkmann, Timo},
  title     = {Speech Enhancement with Score-Based Generative Models in the Complex {STFT} Domain},
  booktitle = {Proceedings of Interspeech},
  year      = {2022},
}
- Carbajal, G., Richter, J., Gerkmann, T., "Guided Variational Autoencoder for Speech Enhancement with a Supervised Classifier", Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2021. BibTeX
% Conference paper: ICASSP 2021.
@Inproceedings{Carbajal2021ICASSPGuidedVAE,
  author    = {Carbajal, Guillaume and Richter, Julius and Gerkmann, Timo},
  title     = {Guided Variational Autoencoder for Speech Enhancement with a Supervised Classifier},
  booktitle = {Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = {2021},
}
- Carbajal, G., Richter, J., Gerkmann, T., "Disentanglement Learning for Variational Autoencoders Applied to Audio-Visual Speech Enhancement", Proceedings of the IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), 2021. BibTeX
% Workshop paper: WASPAA 2021.
@Inproceedings{Carbajal2021WASPAA,
  author    = {Carbajal, Guillaume and Richter, Julius and Gerkmann, Timo},
  title     = {Disentanglement Learning for Variational Autoencoders Applied to Audio-Visual Speech Enhancement},
  booktitle = {Proceedings of the IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
  year      = {2021},
}
- Nguyen, Q., Richter, J., Lauri, M., Gerkmann, T., Frintrop, S., "Improving Mix-and-Separate Training in Audio-Visual Sound Source Separation with an Object Prior", Proceedings of the International Conference on Pattern Recognition (ICPR), 2020. BibTeX
% Conference paper: ICPR 2020.
@Inproceedings{Nguyen2020ICPRAVPrior,
  author    = {Nguyen, Quan and Richter, Julius and Lauri, Mikko and Gerkmann, Timo and Frintrop, Simone},
  title     = {Improving Mix-and-Separate Training in Audio-Visual Sound Source Separation with an Object Prior},
  booktitle = {Proceedings of the International Conference on Pattern Recognition (ICPR)},
  year      = {2020},
}
- Richter, J., Carbajal, G., Gerkmann, T., "Speech Enhancement with Stochastic Temporal Convolutional Networks", Proceedings of Interspeech, 2020. BibTeX
% Conference paper: Interspeech 2020.
@Inproceedings{Richter2020InterspeechTCN,
  author    = {Richter, Julius and Carbajal, Guillaume and Gerkmann, Timo},
  title     = {Speech Enhancement with Stochastic Temporal Convolutional Networks},
  booktitle = {Proceedings of Interspeech},
  year      = {2020},
}
- Richter, J., de Oliveira, D., Gerkmann, T., "EDM2SE: A Magnitude-Preserving Network Architecture for Diffusion-Based Speech Enhancement", Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2026.