- Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
BibTeX TR2025-124 PDF Video Data Presentation- @inproceedings{Yang2025oct,
- author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
- title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-124}
- }
- Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
BibTeX TR2025-149 PDF Video Presentation- @inproceedings{Peng2025oct,
- author = {Peng, Kuan-Chuan},
- title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-149}
- }
- Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, October 2025.
BibTeX TR2025-145 PDF- @article{Shenoy2025oct,
- author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
- title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
- journal = {IEEE Access},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-145}
- }
- Masuyama, Y., Germain, F.G., Wichern, G., Ick, C., Le Roux, J., "Physics-Informed Direction-Aware Neural Acoustic Fields", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2025.
BibTeX TR2025-142 PDF- @inproceedings{Masuyama2025oct,
- author = {Masuyama, Yoshiki and Germain, François G. and Wichern, Gordon and Ick, Christopher and {Le Roux}, Jonathan},
- title = {{Physics-Informed Direction-Aware Neural Acoustic Fields}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-142}
- }
- Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2025.
BibTeX TR2025-143 PDF- @inproceedings{Paissan2025oct,
- author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, François G. and Saijo, Kohei and {Le Roux}, Jonathan},
- title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-143}
- }
- Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025.
BibTeX TR2025-139 PDF- @inproceedings{Zhang2025sep,
- author = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
- title = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year = 2025,
- month = sep,
- url = {https://www.merl.com/publications/TR2025-139}
- }
- Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/TGRS.2025.3604654, Vol. 63, September 2025.
BibTeX TR2025-138 PDF- @article{Hu2025sep2,
- author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
- title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
- journal = {IEEE Transactions on Geoscience and Remote Sensing},
- year = 2025,
- volume = 63,
- month = sep,
- doi = {10.1109/TGRS.2025.3604654},
- issn = {1558-0644},
- url = {https://www.merl.com/publications/TR2025-138}
- }
- Van der Merwe, M., Jha, D.K., "In-Context Iterative Policy Improvement for Dynamic Manipulation", Conference on Robot Learning (CoRL), September 2025.
BibTeX TR2025-136 PDF Video- @inproceedings{VanderMerwe2025sep,
- author = {Van der Merwe, Mark and Jha, Devesh K.},
- title = {{In-Context Iterative Policy Improvement for Dynamic Manipulation}},
- booktitle = {Conference on Robot Learning (CoRL)},
- year = 2025,
- month = sep,
- url = {https://www.merl.com/publications/TR2025-136}
- }
- Liu, J., Koike-Akino, T., Wang, P., Brand, M., Parsons, K., Wang, Y., "LoDA: Low-Dimensional Adaptation of Large Language Models" in Springer Book, September 2025.
BibTeX TR2025-130 PDF- @incollection{Liu2025sep,
- author = {Liu, Jing and Koike-Akino, Toshiaki and Wang, Pu and Brand, Matthew and Parsons, Kieran and Wang, Ye},
- title = {{LoDA: Low-Dimensional Adaptation of Large Language Models}},
- booktitle = {Springer Book},
- year = 2025,
- month = sep,
- url = {https://www.merl.com/publications/TR2025-130}
- }
- Hussein, A., Khurana, S., Wichern, G., Germain, F.G., Le Roux, J., "HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement", Interspeech, DOI: 10.21437/Interspeech.2025-2063, August 2025, pp. 5393-5397.
BibTeX TR2025-122 PDF- @inproceedings{Hussein2025aug,
- author = {Hussein, Amir and Khurana, Sameer and Wichern, Gordon and Germain, François G. and {Le Roux}, Jonathan},
- title = {{HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement}},
- booktitle = {Interspeech},
- year = 2025,
- pages = {5393--5397},
- month = aug,
- publisher = {ISCA},
- doi = {10.21437/Interspeech.2025-2063},
- url = {https://www.merl.com/publications/TR2025-122}
- }
- Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses", Interspeech, DOI: 10.21437/Interspeech.2025-1912, August 2025, pp. 933-937.
BibTeX TR2025-120 PDF- @inproceedings{Ick2025aug,
- author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and {Le Roux}, Jonathan},
- title = {{Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses}},
- booktitle = {Interspeech},
- year = 2025,
- pages = {933--937},
- month = aug,
- publisher = {ISCA},
- doi = {10.21437/Interspeech.2025-1912},
- url = {https://www.merl.com/publications/TR2025-120}
- }
- Khurana, S., Klement, D., Laurent, A., Bobos, D., Novosad, J., Gazdik, P., Zhang, E., Huang, Z., Hussein, A., Marxer, R., Masuyama, Y., Aihara, R., Hori, C., Germain, F.G., Wichern, G., Le Roux, J., "Factorized RVQ-GAN For Disentangled Speech Tokenization", Interspeech, DOI: 10.21437/Interspeech.2025-2612, August 2025, pp. 3514-3518.
BibTeX TR2025-123 PDF- @inproceedings{Khurana2025aug,
- author = {Khurana, Sameer and Klement, Dominik and Laurent, Antoine and Bobos, Dominik and Novosad, Juraj and Gazdik, Peter and Zhang, Ellen and Huang, Zilli and Hussein, Amir and Marxer, Ricard and Masuyama, Yoshiki and Aihara, Ryo and Hori, Chiori and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Factorized RVQ-GAN For Disentangled Speech Tokenization}},
- booktitle = {Interspeech},
- year = 2025,
- pages = {3514--3518},
- month = aug,
- publisher = {ISCA},
- doi = {10.21437/Interspeech.2025-2612},
- url = {https://www.merl.com/publications/TR2025-123}
- }
- Yang, H., Wichern, G., Aihara, R., Masuyama, Y., Khurana, S., Germain, F.G., Le Roux, J., "Investigating Continuous Autoregressive Generative Speech Enhancement", Interspeech, DOI: 10.21437/Interspeech.2025-2335, August 2025, pp. 2360-2364.
BibTeX TR2025-119 PDF- @inproceedings{Yang2025aug,
- author = {Yang, Haici and Wichern, Gordon and Aihara, Ryo and Masuyama, Yoshiki and Khurana, Sameer and Germain, François G. and {Le Roux}, Jonathan},
- title = {{Investigating Continuous Autoregressive Generative Speech Enhancement}},
- booktitle = {Interspeech},
- year = 2025,
- pages = {2360--2364},
- month = aug,
- publisher = {ISCA},
- doi = {10.21437/Interspeech.2025-2335},
- url = {https://www.merl.com/publications/TR2025-119}
- }
- Steinmetz, C., Uhle, C., Everardo, F., Mitcheltree, C., McElveen, J.K., Jot, J.-M., Wichern, G., "Audio Signal Processing in the Artificial Intelligence Era: Challenges and Directions", Journal of the Audio Engineering Society, August 2025.
BibTeX TR2025-116 PDF- @article{Steinmetz2025aug,
- author = {Steinmetz, Christian and Uhle, Christian and Everardo, Flavio and Mitcheltree, Christopher and McElveen, J. Keith and Jot, Jean-Marc and Wichern, Gordon},
- title = {{Audio Signal Processing in the Artificial Intelligence Era: Challenges and Directions}},
- journal = {Journal of the Audio Engineering Society},
- year = 2025,
- month = aug,
- url = {https://www.merl.com/publications/TR2025-116}
- }
- Lewis, A., White, M., Liu, J., Koike-Akino, T., Parsons, K., Wang, Y., "Winning Big with Small Models: Knowledge Distillation vs. Self-Training for Reducing Hallucination in Product QA Agents", ACL 2025 workshop on Generation, Evaluation & Metrics (GEM), July 2025.
BibTeX TR2025-114 PDF- @inproceedings{Lewis2025jul2,
- author = {Lewis, Ashley and White, Michael and Liu, Jing and Koike-Akino, Toshiaki and Parsons, Kieran and Wang, Ye},
- title = {{Winning Big with Small Models: Knowledge Distillation vs. Self-Training for Reducing Hallucination in Product QA Agents}},
- booktitle = {ACL 2025 workshop on Generation, Evaluation \& Metrics (GEM)},
- year = 2025,
- month = jul,
- url = {https://www.merl.com/publications/TR2025-114}
- }
- Almudévar, A., Hernández-Lobato, J.M., Khurana, S., Marxer, R., Ortega, A., "Aligning Multimodal Representations through an Information Bottleneck", International Conference on Machine Learning (ICML), July 2025.
BibTeX TR2025-109 PDF- @inproceedings{Almudévar2025jul,
- author = {Almudévar, Antonio and Hernández-Lobato, José M. and Khurana, Sameer and Marxer, Ricard and Ortega, Alfonso},
- title = {{Aligning Multimodal Representations through an Information Bottleneck}},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2025,
- month = jul,
- url = {https://www.merl.com/publications/TR2025-109}
- }
- Liu, J., Koike-Akino, T., Wang, Y., Mansour, H., Brand, M., "AWP: Activation-Aware Weight Pruning and Quantization with Projected Gradient Descent", International Conference on Machine Learning (ICML) Workshop, July 2025.
BibTeX TR2025-111 PDF Presentation- @inproceedings{Liu2025jul,
- author = {Liu, Jing and Koike-Akino, Toshiaki and Wang, Ye and Mansour, Hassan and Brand, Matthew},
- title = {{AWP: Activation-Aware Weight Pruning and Quantization with Projected Gradient Descent}},
- booktitle = {International Conference on Machine Learning (ICML) Workshop},
- year = 2025,
- month = jul,
- url = {https://www.merl.com/publications/TR2025-111}
- }
- Koike-Akino, T., Liu, J., Wang, Y., "u-MoE: Test-Time Pruning as Micro-Grained Mixture-of-Experts", International Conference on Machine Learning (ICML) Workshop, July 2025.
BibTeX TR2025-112 PDF Presentation- @inproceedings{Koike-Akino2025jul,
- author = {Koike-Akino, Toshiaki and Liu, Jing and Wang, Ye},
- title = {{u-MoE: Test-Time Pruning as Micro-Grained Mixture-of-Experts}},
- booktitle = {International Conference on Machine Learning (ICML) Workshop},
- year = 2025,
- month = jul,
- url = {https://www.merl.com/publications/TR2025-112}
- }
- Wang, R., Wang, Y., Liu, J., Koike-Akino, T., "Quantum Diffusion Models for Few-Shot Learning", ICAD, DOI: 10.1109/ICAD65464.2025.11114033, June 2025.
BibTeX TR2025-095 PDF Presentation- @inproceedings{Wang2025jun2,
- author = {Wang, Ruhan and Wang, Ye and Liu, Jing and Koike-Akino, Toshiaki},
- title = {{Quantum Diffusion Models for Few-Shot Learning}},
- booktitle = {ICAD},
- year = 2025,
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/ICAD65464.2025.11114033},
- isbn = {979-8-3315-2472-2},
- url = {https://www.merl.com/publications/TR2025-095}
- }
- Masuyama, Y., "Single- and Multi-Channel Speech Enhancement and Separation for Far-Field Conversation Recognition," Tech. Rep. TR2025-097, Jelinek Summer Workshop on Speech and Language Technology (JSALT), June 2025.
BibTeX TR2025-097 PDF- @techreport{Masuyama2025jun,
- author = {Masuyama, Yoshiki},
- title = {{Single- and Multi-Channel Speech Enhancement and Separation for Far-Field Conversation Recognition}},
- institution = {Jelinek Summer Workshop on Speech and Language Technology (JSALT)},
- year = 2025,
- month = jun,
- url = {https://www.merl.com/publications/TR2025-097}
- }
- Jung, Y.G., Park, J., Yoon, J., Peng, K.-C., Kim, W., Teoh, A.B.J., Camps, O., "TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S., Eds., DOI: 10.1109/CVPR52734.2025.02378, June 2025, pp. 25539-25548.
BibTeX TR2025-077 PDF Video Presentation- @inproceedings{Jung2025jun,
- author = {Jung, Yoon G. and Park, Jaewoo and Yoon, Jaeho and Peng, Kuan-Chuan and Kim, Wonchul and Teoh, Andrew B. J. and Camps, Octavia},
- title = {{TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2025,
- editor = {Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S.},
- pages = {25539--25548},
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/CVPR52734.2025.02378},
- issn = {2575-7075},
- isbn = {979-8-3315-4364-8},
- url = {https://www.merl.com/publications/TR2025-077}
- }
- Lai, Y.-H., Ebbers, J., Wang, Y.-C.F., Germain, F.G., Jones, M.J., Chatterjee, M., "UWAV: Uncertainty-weighted Weakly-supervised Audio-Visual Video Parsing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2025.
BibTeX TR2025-072 PDF- @inproceedings{Lai2025jun,
- author = {Lai, Yung-Hsuan and Ebbers, Janek and Wang, Yu-Chiang Frank and Germain, François G. and Jones, Michael J. and Chatterjee, Moitreya},
- title = {{UWAV: Uncertainty-weighted Weakly-supervised Audio-Visual Video Parsing}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2025,
- month = jun,
- url = {https://www.merl.com/publications/TR2025-072}
- }
- Hegde, D., Lohit, S., Peng, K.-C., Jones, M.J., Patel, V.M., "Multimodal 3D Object Detection on Unseen Domains", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop, June 2025, pp. 2499-2509.
BibTeX TR2025-078 PDF- @inproceedings{Hegde2025jun,
- author = {Hegde, Deepti and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Patel, Vishal M.},
- title = {{Multimodal 3D Object Detection on Unseen Domains}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
- year = 2025,
- pages = {2499--2509},
- month = jun,
- url = {https://www.merl.com/publications/TR2025-078}
- }
- Koike-Akino, T., Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., "LatentLLM: Attention-Aware Joint Tensor Compression", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop, June 2025.
BibTeX TR2025-075 PDF Presentation- @inproceedings{Koike-Akino2025jun,
- author = {Koike-Akino, Toshiaki and Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew},
- title = {{LatentLLM: Attention-Aware Joint Tensor Compression}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
- year = 2025,
- month = jun,
- url = {https://www.merl.com/publications/TR2025-075}
- }
- Li, K., Zhang, T., Peng, K.-C., Wang, G., "PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop, June 2025, pp. 3787-3796.
BibTeX TR2025-076 PDF Presentation- @inproceedings{Li2025jun,
- author = {Li, Kaidong and Zhang, Tianxiao and Peng, Kuan-Chuan and Wang, Guanghui},
- title = {{PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
- year = 2025,
- pages = {3787--3796},
- month = jun,
- url = {https://www.merl.com/publications/TR2025-076}
- }