Publications

709 / 3,973 publications found.


  •  Khattar, V., Choudhury, M., Rashid, M.R.U., Liu, J., Koike-Akino, T., Jin, M., Wang, Y., "Amplification Effects in Test-Time Reinforcement Learning: Safety and Reasoning Vulnerabilities", AAAI Workshop on Trust and Control in Agentic AI, January 2026.
    BibTeX TR2026-020 PDF
    • @inproceedings{Khattar2026jan,
    • author = {Khattar, Vanshaj and Choudhury, Moumita and Rashid, Md Rafi Ur and Liu, Jing and Koike-Akino, Toshiaki and Jin, Ming and Wang, Ye},
    • title = {{Amplification Effects in Test-Time Reinforcement Learning: Safety and Reasoning Vulnerabilities}},
    • booktitle = {AAAI Workshop on Trust and Control in Agentic AI},
    • year = 2026,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2026-020}
    • }
  •  Fujihashi, T., Koike-Akino, T., "Quantum Implicit Neural Compression", Springer Nature, January 2026.
    BibTeX TR2026-022 PDF
    • @article{Fujihashi2026jan,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
    • title = {{Quantum Implicit Neural Compression}},
    • journal = {Springer Nature},
    • year = 2026,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2026-022}
    • }
  •  Koike-Akino, T., Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., "LatentLLM: Activation-Aware Transform to Multi-Head Latent Attention", AAAI Conference on Artificial Intelligence, January 2026.
    BibTeX TR2026-018 PDF Video Presentation
    • @inproceedings{Koike-Akino2026jan,
    • author = {Koike-Akino, Toshiaki and Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew},
    • title = {{LatentLLM: Activation-Aware Transform to Multi-Head Latent Attention}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2026,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2026-018}
    • }
  •  Rashid, M.R.U., Dasu, V.A., Wang, Y., Tan, G.G., Mehnaz, S., "Chain-of-Thought Driven Adversarial Scenario Extrapolation for Robust Language Models", AAAI Conference on Artificial Intelligence, January 2026.
    BibTeX TR2026-017 PDF
    • @inproceedings{Rashid2026jan,
    • author = {Rashid, Md Rafi Ur and Dasu, Vishnu Asutosh and Wang, Ye and Tan, G. Gary and Mehnaz, Shagufta},
    • title = {{Chain-of-Thought Driven Adversarial Scenario Extrapolation for Robust Language Models}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2026,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2026-017}
    • }
  •  Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Embracing Cacophony: Explaining and Improving Random Mixing in Music Source Separation", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3633567, Vol. 6, pp. 1179-1192, January 2026.
    BibTeX TR2026-012 PDF
    • @article{Jeon2026jan,
    • author = {Jeon, Chang-Bin and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
    • title = {{Embracing Cacophony: Explaining and Improving Random Mixing in Music Source Separation}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2026,
    • volume = 6,
    • pages = {1179--1192},
    • month = jan,
    • doi = {10.1109/OJSP.2025.3633567},
    • url = {https://www.merl.com/publications/TR2026-012}
    • }
  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Local Density-Based Anomaly Score Normalization for Domain Generalization", IEEE Transactions on Audio, Speech and Language Processing, January 2026.
    BibTeX TR2026-010 PDF Software
    • @article{Wilkinghoff2026jan,
    • author = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Local Density-Based Anomaly Score Normalization for Domain Generalization}},
    • journal = {IEEE Transactions on Audio, Speech and Language Processing},
    • year = 2026,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2026-010}
    • }
  •  Cornell, S., Boeddeker, C., Park, T., Huang, H., Raj, D., Wiesner, M., Masuyama, Y., Chang, X., Wang, Z.-Q., Squartini, S., Garcia, P., Watanabe, S., "Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges", Computer Speech & Language, DOI: 10.1016/j.csl.2025.101901, Vol. 97, pp. 101901, December 2025.
    BibTeX TR2026-008 PDF
    • @article{Cornell2025dec,
    • author = {Cornell, Samuele and Boeddeker, Christoph and Park, Taejin and Huang, He and Raj, Desh and Wiesner, Matthew and Masuyama, Yoshiki and Chang, Xuankai and Wang, Zhong-Qiu and Squartini, Stefano and Garcia, Paola and Watanabe, Shinji},
    • title = {{Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges}},
    • journal = {Computer Speech \& Language},
    • year = 2025,
    • volume = 97,
    • pages = 101901,
    • month = dec,
    • doi = {10.1016/j.csl.2025.101901},
    • url = {https://www.merl.com/publications/TR2026-008}
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "RANF: Neural Field-Based HRTF Spatial Upsampling with Retrieval Augmentation and Parameter Efficient Fine-Tuning", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3640517, Vol. 7, pp. 32-41, December 2025.
    BibTeX TR2026-007 PDF Software
    • @article{Masuyama2025dec,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{RANF: Neural Field-Based HRTF Spatial Upsampling with Retrieval Augmentation and Parameter Efficient Fine-Tuning}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2025,
    • volume = 7,
    • pages = {32--41},
    • month = dec,
    • doi = {10.1109/OJSP.2025.3640517},
    • url = {https://www.merl.com/publications/TR2026-007}
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "SuDaField: Subject- and Dataset-Aware Neural Field for HRTF Modeling", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3627073, Vol. 6, pp. 1169-1178, December 2025.
    BibTeX TR2026-009 PDF
    • @article{Masuyama2025dec2,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{SuDaField: Subject- and Dataset-Aware Neural Field for HRTF Modeling}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2025,
    • volume = 6,
    • pages = {1169--1178},
    • month = dec,
    • doi = {10.1109/OJSP.2025.3627073},
    • url = {https://www.merl.com/publications/TR2026-009}
    • }
  •  Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2025.
    BibTeX TR2025-167 PDF
    • @inproceedings{Hori2025dec,
    • author = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-167}
    • }
  •  Van der Merwe, M., Jha, D.K., "In-Context Policy Iteration for Dynamic Manipulation", Advances in Neural Information Processing Systems (NeurIPS) Workshop on Embodied World Models for Decision Making, December 2025.
    BibTeX TR2025-163 PDF Video
    • @inproceedings{VanderMerwe2025dec,
    • author = {{Van der Merwe}, Mark and Jha, Devesh K.},
    • title = {{In-Context Policy Iteration for Dynamic Manipulation}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) Workshop on Embodied World Models for Decision Making},
    • year = 2025,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-163}
    • }
  •  Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
    BibTeX TR2025-162 PDF Video Data Presentation
    • @inproceedings{Xiang2025nov,
    • author = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
    • title = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-162}
    • }
  •  Masuyama, Y., "Neural Fields for Spatial Audio Modeling," Tech. Rep. TR2025-171, Speech and Audio in the Northeast (SANE), November 2025.
    BibTeX TR2025-171 PDF
    • @techreport{Masuyama2025nov,
    • author = {Masuyama, Yoshiki},
    • title = {{Neural Fields for Spatial Audio Modeling}},
    • institution = {Speech and Audio in the Northeast (SANE)},
    • number = {TR2025-171},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-171}
    • }
  •  Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), DOI: 10.5281/zenodo.17251589, October 2025, pp. 20-24.
    BibTeX TR2025-157 PDF
    • @inproceedings{Wilkinghoff2025oct,
    • author = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
    • title = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
    • booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
    • year = 2025,
    • pages = {20--24},
    • month = oct,
    • doi = {10.5281/zenodo.17251589},
    • isbn = {978-84-09-77652-8},
    • url = {https://www.merl.com/publications/TR2025-157}
    • }
  •  Fujihashi, T., Kuwabara, A., Koike-Akino, T., "QKAN-GS: Quantum-Empowered 3D Gaussian Splatting", ACM Multimedia Workshop, DOI: 10.1145/3728486.375921, October 2025, pp. 51-55.
    BibTeX TR2025-156 PDF
    • @inproceedings{Fujihashi2025oct,
    • author = {Fujihashi, Takuya and Kuwabara, Akihiro and Koike-Akino, Toshiaki},
    • title = {{QKAN-GS: Quantum-Empowered 3D Gaussian Splatting}},
    • booktitle = {ACM Multimedia Workshop},
    • year = 2025,
    • pages = {51--55},
    • month = oct,
    • publisher = {ACM},
    • doi = {10.1145/3728486.375921},
    • url = {https://www.merl.com/publications/TR2025-156}
    • }
  •  Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-124 PDF Video Data Presentation
    • @inproceedings{Yang2025oct,
    • author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
    • title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-124}
    • }
  •  Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
    BibTeX TR2025-149 PDF Video Presentation
    • @inproceedings{Peng2025oct,
    • author = {Peng, Kuan-Chuan},
    • title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-149}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, October 2025.
    BibTeX TR2025-145 PDF
    • @article{Shenoy2025oct,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {IEEE Access},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-145}
    • }
  •  Masuyama, Y., Germain, F.G., Wichern, G., Ick, C., Le Roux, J., "Physics-Informed Direction-Aware Neural Acoustic Fields", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230918, October 2025.
    BibTeX TR2025-142 PDF
    • @inproceedings{Masuyama2025oct,
    • author = {Masuyama, Yoshiki and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{Physics-Informed Direction-Aware Neural Acoustic Fields}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/WASPAA66052.2025.11230918},
    • url = {https://www.merl.com/publications/TR2025-142}
    • }
  •  Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230943, October 2025.
    BibTeX TR2025-143 PDF
    • @inproceedings{Paissan2025oct,
    • author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, Fran{\c{c}}ois G. and Saijo, Kohei and {Le Roux}, Jonathan},
    • title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2025,
    • month = oct,
    • doi = {10.1109/WASPAA66052.2025.11230943},
    • url = {https://www.merl.com/publications/TR2025-143}
    • }
  •  Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025, pp. 6304-6314.
    BibTeX TR2025-139 PDF
    • @inproceedings{Zhang2025sep,
    • author = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
    • title = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • pages = {6304--6314},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2025-139}
    • }
  •  Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/TGRS.2025.3604654, Vol. 63, September 2025.
    BibTeX TR2025-138 PDF
    • @article{Hu2025sep2,
    • author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
    • title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
    • journal = {IEEE Transactions on Geoscience and Remote Sensing},
    • year = 2025,
    • volume = 63,
    • month = sep,
    • doi = {10.1109/TGRS.2025.3604654},
    • issn = {1558-0644},
    • url = {https://www.merl.com/publications/TR2025-138}
    • }
  •  Van der Merwe, M., Jha, D.K., "In-Context Iterative Policy Improvement for Dynamic Manipulation", Conference on Robot Learning (CoRL), September 2025.
    BibTeX TR2025-136 PDF Video
    • @inproceedings{VanderMerwe2025sep,
    • author = {{Van der Merwe}, Mark and Jha, Devesh K.},
    • title = {{In-Context Iterative Policy Improvement for Dynamic Manipulation}},
    • booktitle = {Conference on Robot Learning (CoRL)},
    • year = 2025,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2025-136}
    • }
  •  Hussein, A., Khurana, S., Wichern, G., Germain, F.G., Le Roux, J., "HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement", Interspeech, DOI: 10.21437/Interspeech.2025-2063, August 2025, pp. 5393-5397.
    BibTeX TR2025-122 PDF
    • @inproceedings{Hussein2025aug,
    • author = {Hussein, Amir and Khurana, Sameer and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
    • title = {{HASRD: Hierarchical Acoustic and Semantic Representation Disentanglement}},
    • booktitle = {Interspeech},
    • year = 2025,
    • pages = {5393--5397},
    • month = aug,
    • publisher = {ISCA},
    • doi = {10.21437/Interspeech.2025-2063},
    • url = {https://www.merl.com/publications/TR2025-122}
    • }
  •  Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses", Interspeech, DOI: 10.21437/Interspeech.2025-1912, August 2025, pp. 933-937.
    BibTeX TR2025-120 PDF
    • @inproceedings{Ick2025aug,
    • author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
    • title = {{Direction-Aware Neural Acoustic Fields for Few-Shot Interpolation of Ambisonic Impulse Responses}},
    • booktitle = {Interspeech},
    • year = 2025,
    • pages = {933--937},
    • month = aug,
    • doi = {10.21437/Interspeech.2025-1912},
    • url = {https://www.merl.com/publications/TR2025-120}
    • }