- Khattar, V., Choudhury, M., Rashid, M.R.U., Liu, J., Koike-Akino, T., Jin, M., Wang, Y., "Amplification Effects in Test-Time Reinforcement Learning: Safety and Reasoning Vulnerabilities", AAAI Workshop on Trust and Control in Agentic AI, January 2026.
BibTeX TR2026-020 PDF- @inproceedings{Khattar2026jan,
- author = {Khattar, Vanshaj and Choudhury, Moumita and Rashid, Md Rafi Ur and Liu, Jing and Koike-Akino, Toshiaki and Jin, Ming and Wang, Ye},
- title = {{Amplification Effects in Test-Time Reinforcement Learning: Safety and Reasoning Vulnerabilities}},
- booktitle = {AAAI Workshop on Trust and Control in Agentic AI},
- year = 2026,
- month = jan,
- url = {https://www.merl.com/publications/TR2026-020}
- }
- Fujihashi, T., Koike-Akino, T., "Quantum Implicit Neural Compression", Springer Nature, January 2026.
BibTeX TR2026-022 PDF- @article{Fujihashi2026jan,
- author = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
- title = {{Quantum Implicit Neural Compression}},
- journal = {Springer Nature},
- year = 2026,
- month = jan,
- url = {https://www.merl.com/publications/TR2026-022}
- }
- Koike-Akino, T., Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., "LatentLLM: Activation-Aware Transform to Multi-Head Latent Attention", AAAI Conference on Artificial Intelligence, January 2026.
BibTeX TR2026-018 PDF Video Presentation- @inproceedings{Koike-Akino2026jan,
- author = {Koike-Akino, Toshiaki and Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew},
- title = {{LatentLLM: Activation-Aware Transform to Multi-Head Latent Attention}},
- booktitle = {AAAI Conference on Artificial Intelligence},
- year = 2026,
- month = jan,
- url = {https://www.merl.com/publications/TR2026-018}
- }
- Rashid, M.R.U., Dasu, V.A., Wang, Y., Tan, G.G., Mehnaz, S., "Chain-of-Thought Driven Adversarial Scenario Extrapolation for Robust Language Models", AAAI Conference on Artificial Intelligence, January 2026.
BibTeX TR2026-017 PDF- @inproceedings{Rashid2026jan,
- author = {Rashid, Md Rafi Ur and Dasu, Vishnu Asutosh and Wang, Ye and Tan, G. Gary and Mehnaz, Shagufta},
- title = {{Chain-of-Thought Driven Adversarial Scenario Extrapolation for Robust Language Models}},
- booktitle = {AAAI Conference on Artificial Intelligence},
- year = 2026,
- month = jan,
- url = {https://www.merl.com/publications/TR2026-017}
- }
- Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Embracing Cacophony: Explaining and Improving Random Mixing in Music Source Separation", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3633567, Vol. 6, pp. 1179-1192, January 2026.
BibTeX TR2026-012 PDF- @article{Jeon2026jan,
- author = {Jeon, Chang-Bin and Wichern, Gordon and Germain, François G. and {Le Roux}, Jonathan},
- title = {{Embracing Cacophony: Explaining and Improving Random Mixing in Music Source Separation}},
- journal = {IEEE Open Journal of Signal Processing},
- year = 2026,
- volume = 6,
- pages = {1179--1192},
- month = jan,
- doi = {10.1109/OJSP.2025.3633567},
- url = {https://www.merl.com/publications/TR2026-012}
- }
- Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Local Density-Based Anomaly Score Normalization for Domain Generalization", IEEE Transactions on Audio, Speech and Language Processing, January 2026.
BibTeX TR2026-010 PDF Software- @article{Wilkinghoff2026jan,
- author = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Local Density-Based Anomaly Score Normalization for Domain Generalization}},
- journal = {IEEE Transactions on Audio, Speech and Language Processing},
- year = 2026,
- month = jan,
- url = {https://www.merl.com/publications/TR2026-010}
- }
- Cornell, S., Boeddeker, C., Park, T., Huang, H., Raj, D., Wiesner, M., Masuyama, Y., Chang, X., Wang, Z.-Q., Squartini, S., Garcia, P., Watanabe, S., "Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges", Computer Speech & Language, DOI: 10.1016/j.csl.2025.101901, Vol. 97, pp. 101901, December 2025.
BibTeX TR2026-008 PDF- @article{Cornell2025dec,
- author = {Cornell, Samuele and Boeddeker, Christoph and Park, Taejin and Huang, He and Raj, Desh and Wiesner, Matthew and Masuyama, Yoshiki and Chang, Xuankai and Wang, Zhong-Qiu and Squartini, Stefano and Garcia, Paola and Watanabe, Shinji},
- title = {{Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges}},
- journal = {Computer Speech \& Language},
- year = 2025,
- volume = 97,
- pages = 101901,
- month = dec,
- doi = {10.1016/j.csl.2025.101901},
- url = {https://www.merl.com/publications/TR2026-008}
- }
- Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "RANF: Neural Field-Based HRTF Spatial Upsampling with Retrieval Augmentation and Parameter Efficient Fine-Tuning", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3640517, Vol. 7, pp. 32-41, December 2025.
BibTeX TR2026-007 PDF Software- @article{Masuyama2025dec,
- author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G. and Ick, Christopher and {Le Roux}, Jonathan},
- title = {{RANF: Neural Field-Based HRTF Spatial Upsampling with Retrieval Augmentation and Parameter Efficient Fine-Tuning}},
- journal = {IEEE Open Journal of Signal Processing},
- year = 2025,
- volume = 7,
- pages = {32--41},
- month = dec,
- doi = {10.1109/OJSP.2025.3640517},
- url = {https://www.merl.com/publications/TR2026-007}
- }
- Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "SuDaField: Subject- and Dataset-Aware Neural Field for HRTF Modeling", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3627073, Vol. 6, pp. 1169-1178, December 2025.
BibTeX TR2026-009 PDF- @article{Masuyama2025dec2,
- author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G. and Ick, Christopher and {Le Roux}, Jonathan},
- title = {{SuDaField: Subject- and Dataset-Aware Neural Field for HRTF Modeling}},
- journal = {IEEE Open Journal of Signal Processing},
- year = 2025,
- volume = 6,
- pages = {1169--1178},
- month = dec,
- doi = {10.1109/OJSP.2025.3627073},
- url = {https://www.merl.com/publications/TR2026-009}
- }
- Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2025.
BibTeX TR2025-167 PDF- @inproceedings{Hori2025dec,
- author = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
- title = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2025,
- month = dec,
- url = {https://www.merl.com/publications/TR2025-167}
- }
- Van der Merwe, M., Jha, D.K., "In-Context Policy Iteration for Dynamic Manipulation", Advances in Neural Information Processing Systems (NeurIPS) Workshop on Embodied World Models for Decision Making, December 2025.
BibTeX TR2025-163 PDF Video- @inproceedings{VanderMerwe2025dec,
- author = {{Van der Merwe}, Mark and Jha, Devesh K.},
- title = {{In-Context Policy Iteration for Dynamic Manipulation}},
- booktitle = {Advances in Neural Information Processing Systems (NeurIPS) Workshop on Embodied World Models for Decision Making},
- year = 2025,
- month = dec,
- url = {https://www.merl.com/publications/TR2025-163}
- }
- Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
BibTeX TR2025-162 PDF Video Data Presentation- @inproceedings{Xiang2025nov,
- author = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
- title = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
- booktitle = {British Machine Vision Conference (BMVC)},
- year = 2025,
- month = nov,
- url = {https://www.merl.com/publications/TR2025-162}
- }
- Masuyama, Y., "Neural Fields for Spatial Audio Modeling", Tech. Rep. TR2025-171, Speech and Audio in the Northeast (SANE), November 2025.
BibTeX TR2025-171 PDF- @techreport{Masuyama2025nov,
- author = {Masuyama, Yoshiki},
- title = {{Neural Fields for Spatial Audio Modeling}},
- institution = {Speech and Audio in the Northeast (SANE)},
- year = 2025,
- month = nov,
- url = {https://www.merl.com/publications/TR2025-171}
- }
- Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), DOI: 10.5281/zenodo.17251589, October 2025, pp. 20-24.
BibTeX TR2025-157 PDF- @inproceedings{Wilkinghoff2025oct,
- author = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
- title = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
- booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
- year = 2025,
- pages = {20--24},
- month = oct,
- doi = {10.5281/zenodo.17251589},
- isbn = {978-84-09-77652-8},
- url = {https://www.merl.com/publications/TR2025-157}
- }
- Fujihashi, T., Kuwabara, A., Koike-Akino, T., "QKAN-GS: Quantum-Empowered 3D Gaussian Splatting", ACM Multimedia Workshop, DOI: 10.1145/3728486.375921, October 2025, pp. 51-55.
BibTeX TR2025-156 PDF- @inproceedings{Fujihashi2025oct,
- author = {Fujihashi, Takuya and Kuwabara, Akihiro and Koike-Akino, Toshiaki},
- title = {{QKAN-GS: Quantum-Empowered 3D Gaussian Splatting}},
- booktitle = {ACM Multimedia Workshop},
- year = 2025,
- pages = {51--55},
- month = oct,
- publisher = {ACM},
- doi = {10.1145/3728486.375921},
- url = {https://www.merl.com/publications/TR2025-156}
- }
- Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
BibTeX TR2025-124 PDF Video Data Presentation- @inproceedings{Yang2025oct,
- author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
- title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-124}
- }
- Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
BibTeX TR2025-149 PDF Video Presentation- @inproceedings{Peng2025oct,
- author = {Peng, Kuan-Chuan},
- title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
- booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-149}
- }
- Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, October 2025.
BibTeX TR2025-145 PDF- @article{Shenoy2025oct,
- author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
- title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
- journal = {IEEE Access},
- year = 2025,
- month = oct,
- url = {https://www.merl.com/publications/TR2025-145}
- }
- Masuyama, Y., Germain, F.G., Wichern, G., Ick, C., Le Roux, J., "Physics-Informed Direction-Aware Neural Acoustic Fields", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230918, October 2025.
BibTeX TR2025-142 PDF- @inproceedings{Masuyama2025oct,
- author = {Masuyama, Yoshiki and Germain, François G. and Wichern, Gordon and Ick, Christopher and {Le Roux}, Jonathan},
- title = {{Physics-Informed Direction-Aware Neural Acoustic Fields}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2025,
- month = oct,
- doi = {10.1109/WASPAA66052.2025.11230918},
- url = {https://www.merl.com/publications/TR2025-142}
- }
- Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230943, October 2025.
BibTeX TR2025-143 PDF- @inproceedings{Paissan2025oct,
- author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, François G. and Saijo, Kohei and {Le Roux}, Jonathan},
- title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2025,
- month = oct,
- doi = {10.1109/WASPAA66052.2025.11230943},
- url = {https://www.merl.com/publications/TR2025-143}
- }
- Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025, pp. 6304-6314.
BibTeX TR2025-139 PDF- @inproceedings{Zhang2025sep,
- author = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
- title = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
- booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
- year = 2025,
- pages = {6304--6314},
- month = sep,
- url = {https://www.merl.com/publications/TR2025-139}
- }
- Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/TGRS.2025.3604654, Vol. 63, September 2025.
BibTeX TR2025-138 PDF- @article{Hu2025sep2,
- author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
- title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
- journal = {IEEE Transactions on Geoscience and Remote Sensing},
- year = 2025,
- volume = 63,
- month = sep,
- doi = {10.1109/TGRS.2025.3604654},
- issn = {1558-0644},
- url = {https://www.merl.com/publications/TR2025-138}
- }
- Van der Merwe, M., Jha, D.K., "In-Context Iterative Policy Improvement for Dynamic Manipulation", Conference on Robot Learning (CoRL), September 2025.
BibTeX TR2025-136 PDF Video- @inproceedings{VanderMerwe2025sep,
- author = {{Van der Merwe}, Mark and Jha, Devesh K.},
- title = {{In-Context Iterative Policy Improvement for Dynamic Manipulation}},
- booktitle = {Conference on Robot Learning (CoRL)},
- year = 2025,
- month = sep,
- url = {https://www.merl.com/publications/TR2025-136}
- }
- Hussein, A., Khurana, S., Wichern, G., Germain, F.G., Le Roux, J., "HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement", Interspeech, DOI: 10.21437/Interspeech.2025-2063, August 2025, pp. 5393-5397.
BibTeX TR2025-122 PDF- @inproceedings{Hussein2025aug,
- author = {Hussein, Amir and Khurana, Sameer and Wichern, Gordon and Germain, François G. and {Le Roux}, Jonathan},
- title = {{HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement}},
- booktitle = {Interspeech},
- year = 2025,
- pages = {5393--5397},
- month = aug,
- publisher = {ISCA},
- doi = {10.21437/Interspeech.2025-2063},
- url = {https://www.merl.com/publications/TR2025-122}
- }
- Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses", Interspeech, DOI: 10.21437/Interspeech.2025-1912, August 2025, pp. 933-937.
BibTeX TR2025-120 PDF- @inproceedings{Ick2025aug,
- author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and {Le Roux}, Jonathan},
- title = {{Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses}},
- booktitle = {Interspeech},
- year = 2025,
- pages = {933--937},
- month = aug,
- doi = {10.21437/Interspeech.2025-1912},
- url = {https://www.merl.com/publications/TR2025-120}
- }