Publications

8 / 3,993 publications found.


  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Local Density-Based Anomaly Score Normalization for Domain Generalization", IEEE Transactions on Audio, Speech and Language Processing, DOI: 10.1109/TASLPRO.2025.3629236, Vol. 33, pp. 4642-4652, January 2026.
    BibTeX TR2026-010 PDF Software
    @article{Wilkinghoff2026jan,
      author  = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
      title   = {Local Density-Based Anomaly Score Normalization for Domain Generalization},
      journal = {IEEE Transactions on Audio, Speech and Language Processing},
      year    = 2026,
      volume  = 33,
      pages   = {4642--4652},
      month   = jan,
      doi     = {10.1109/TASLPRO.2025.3629236},
      issn    = {2998-4173},
      url     = {https://www.merl.com/publications/TR2026-010}
    }
  •  Lai, Y.-H., Ebbers, J., Wang, Y.-C.F., Germain, F.G., Jones, M.J., Chatterjee, M., "UWAV: Uncertainty-weighted Weakly-supervised Audio-Visual Video Parsing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR52734.2025.01266, June 2025, pp. 13561-13570.
    BibTeX TR2025-072 PDF
    @inproceedings{Lai2025jun,
      author    = {Lai, Yung-Hsuan and Ebbers, Janek and Wang, Yu-Chiang Frank and Germain, Fran{\c{c}}ois G. and Jones, Michael J. and Chatterjee, Moitreya},
      title     = {{UWAV}: Uncertainty-weighted Weakly-supervised Audio-Visual Video Parsing},
      booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
      year      = 2025,
      pages     = {13561--13570},
      month     = jun,
      publisher = {IEEE},
      doi       = {10.1109/CVPR52734.2025.01266},
      url       = {https://www.merl.com/publications/TR2025-072}
    }
  •  Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890706, April 2025.
    BibTeX TR2025-037 PDF
    @inproceedings{Ebbers2025mar,
      author    = {Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
      title     = {No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year      = 2025,
      month     = apr,
      doi       = {10.1109/ICASSP49660.2025.10890706},
      url       = {https://www.merl.com/publications/TR2025-037}
    }
  •  Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888769, April 2025.
    BibTeX TR2025-033 PDF
    @inproceedings{Saijo2025mar2,
      author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
      title     = {Leveraging Audio-Only Data for Text-Queried Target Sound Extraction},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year      = 2025,
      month     = apr,
      doi       = {10.1109/ICASSP49660.2025.10888769},
      url       = {https://www.merl.com/publications/TR2025-033}
    }
  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887819, April 2025.
    BibTeX TR2025-032 PDF Software
    @inproceedings{Saijo2025mar,
      author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
      title     = {Task-Aware Unified Source Separation},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year      = 2025,
      month     = apr,
      doi       = {10.1109/ICASSP49660.2025.10887819},
      url       = {https://www.merl.com/publications/TR2025-032}
    }
  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Keeping the Balance: Anomaly Score Calculation for Domain Generalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888402, April 2025.
    BibTeX TR2025-030 PDF Software
    @inproceedings{Wilkinghoff2025mar,
      author    = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
      title     = {Keeping the Balance: Anomaly Score Calculation for Domain Generalization},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year      = 2025,
      month     = apr,
      doi       = {10.1109/ICASSP49660.2025.10888402},
      url       = {https://www.merl.com/publications/TR2025-030}
    }
  •  Cornell, S., Ebbers, J., Douwes, C., Martin-Morato, I., Harju, M., Mesaros, A., Serizel, R., "DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels", Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop, October 2024, pp. 31-35.
    BibTeX TR2024-146 PDF
    @inproceedings{Cornell2024oct,
      author    = {Cornell, Samuele and Ebbers, Janek and Douwes, Constance and Martin-Morato, Irene and Harju, Manu and Mesaros, Annamaria and Serizel, Romain},
      title     = {{DCASE} 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels},
      booktitle = {Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop},
      year      = 2024,
      pages     = {31--35},
      month     = oct,
      url       = {https://www.merl.com/publications/TR2024-146}
    }
  •  Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Sound Event Bounding Boxes", Interspeech, DOI: 10.21437/Interspeech.2024-2075, September 2024, pp. 562-566.
    BibTeX TR2024-118 PDF Software
    @inproceedings{Ebbers2024sep,
      author    = {Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
      title     = {Sound Event Bounding Boxes},
      booktitle = {Interspeech},
      year      = 2024,
      pages     = {562--566},
      month     = sep,
      doi       = {10.21437/Interspeech.2024-2075},
      issn      = {2958-1796},
      url       = {https://www.merl.com/publications/TR2024-118}
    }