Publications

657 / 3,798 publications found.


  •  Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
    BibTeX TR2025-039 PDF
    • @inproceedings{Ranade2025mar,
    • author = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
    • title = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
    • booktitle = {International Conference on 3D Vision (3DV)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-039}
    • }
  •  Araki, S., Ito, N., Haeb-Umbach, R., Wichern, G., Wang, Z.-Q., Mitsufuji, Y., "30+ Years of Source Separation Research: Achievements and Future Challenges", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-036 PDF
    • @inproceedings{Araki2025mar,
    • author = {Araki, Shoko and Ito, Nobutaka and Haeb-Umbach, Reinhold and Wichern, Gordon and Wang, Zhong-Qiu and Mitsufuji, Yuki},
    • title = {{30+ Years of Source Separation Research: Achievements and Future Challenges}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-036}
    • }
  •  Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-037 PDF
    • @inproceedings{Ebbers2025mar,
    • author = {Ebbers, Janek and Germain, François G and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-037}
    • }
  •  Gruttadauria, E., Fontaine, M., Le Roux, J., Essid, S., "O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-031 PDF
    • @inproceedings{Gruttadauria2025mar,
    • author = {Gruttadauria, Elio and Fontaine, Mathieu and {Le Roux}, Jonathan and Essid, Slim},
    • title = {{O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-031}
    • }
  •  Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-034 PDF
    • @inproceedings{Hori2025mar,
    • author = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-034}
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-029 PDF Software
    • @inproceedings{Masuyama2025mar,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-029}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-033 PDF
    • @inproceedings{Saijo2025mar2,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Leveraging Audio-Only Data for Text-Queried Target Sound Extraction}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-033}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-032 PDF
    • @inproceedings{Saijo2025mar,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Task-Aware Unified Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-032}
    • }
  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Keeping the Balance: Anomaly Score Calculation for Domain Generalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-030 PDF
    • @inproceedings{Wilkinghoff2025mar,
    • author = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, François G and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Keeping the Balance: Anomaly Score Calculation for Domain Generalization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-030}
    • }
  •  Tian, J., Shi, J., Chen, W., Arora, S., Masuyama, Y., Maekaku, T., Wu, Y., Peng, J., Bharadwaj, S., Zhao, Y., Cornell, S., Peng, Y., Yue, X., Yang, C.-H.H., Neubig, G., Watanabe, S., "ESPnet-SpeechLM: An Open Speech Language Model Toolkit", NAACL-HLT (the system demonstration track), March 2025.
    BibTeX TR2025-038 PDF
    • @inproceedings{Tian2025mar,
    • author = {Tian, Jinchuan and Shi, Jiatong and Chen, William and Arora, Siddhant and Masuyama, Yoshiki and Maekaku, Takashi and Wu, Yihan and Peng, Junyi and Bharadwaj, Shikhar and Zhao, Yiwen and Cornell, Samuele and Peng, Yifan and Yue, Xiang and Yang, Chao-Han H. and Neubig, Graham and Watanabe, Shinji},
    • title = {{ESPnet-SpeechLM: An Open Speech Language Model Toolkit}},
    • booktitle = {NAACL-HLT (the system demonstration track)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-038}
    • }
  •  Wang, R., Wang, Y., Liu, J., Koike-Akino, T., "Quantum Diffusion Models for Few-Shot Learning", AAAI Conference on Artificial Intelligence, March 2025.
    BibTeX TR2025-025 PDF
    • @inproceedings{Wang2025mar,
    • author = {Wang, Ruhan and Wang, Ye and Liu, Jing and Koike-Akino, Toshiaki},
    • title = {{Quantum Diffusion Models for Few-Shot Learning}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-025}
    • }
  •  Fujihashi, T., Koike-Akino, T., "Quantum Implicit Neural Compression", AAAI Conference on Artificial Intelligence, March 2025.
    BibTeX TR2025-024 PDF
    • @inproceedings{Fujihashi2025mar,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
    • title = {{Quantum Implicit Neural Compression}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-024}
    • }
  •  Wang, Y., Peng, K.-C., Fu, R., "Towards Zero-shot 3D Anomaly Localization", IEEE Winter Conference on Applications of Computer Vision (WACV), February 2025.
    BibTeX TR2025-020 PDF Video Presentation
    • @inproceedings{Wang2025feb2,
    • author = {Wang, Yizhou and Peng, Kuan-Chuan and Fu, Raymond},
    • title = {{Towards Zero-shot 3D Anomaly Localization}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2025,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2025-020}
    • }
  •  Rashid, M.R.U., Liu, J., Koike-Akino, T., Wang, Y., Mehnaz, S., "Forget to Flourish: Leveraging Machine-Unlearning on Pretrained Language Models for Privacy Leakage", AAAI Conference on Artificial Intelligence, February 2025.
    BibTeX TR2025-017 PDF
    • @inproceedings{Rashid2025feb,
    • author = {Rashid, Md Rafi Ur and Liu, Jing and Koike-Akino, Toshiaki and Wang, Ye and Mehnaz, Shagufta},
    • title = {{Forget to Flourish: Leveraging Machine-Unlearning on Pretrained Language Models for Privacy Leakage}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2025,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2025-017}
    • }
  •  Mumcu, F., Jones, M.J., Yilmaz, Y., Cherian, A., "ComplexVAD: Detecting Interaction Anomalies in Video", IEEE Winter Conference on Applications of Computer Vision (WACV) Workshop, February 2025.
    BibTeX TR2025-016 PDF
    • @inproceedings{Mumcu2025feb,
    • author = {Mumcu, Furkan and Jones, Michael J. and Yilmaz, Yasin and Cherian, Anoop},
    • title = {{ComplexVAD: Detecting Interaction Anomalies in Video}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV) Workshop},
    • year = 2025,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2025-016}
    • }
  •  Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3534686, Vol. 6, pp. 266-275, January 2025.
    BibTeX TR2025-012 PDF Software
    • @article{Koo2025jan,
    • author = {Koo, Junghyun and Wichern, Gordon and Germain, François G and Khurana, Sameer and {Le Roux}, Jonathan},
    • title = {{SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers}},
    • journal = {IEEE Open Journal of Signal Processing},
    • year = 2025,
    • volume = 6,
    • pages = {266--275},
    • month = jan,
    • doi = {10.1109/OJSP.2025.3534686},
    • issn = {2644-1322},
    • url = {https://www.merl.com/publications/TR2025-012}
    • }
  •  Lohit, S., Marks, T.K., "Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images", Asilomar Conference on Signals, Systems, and Computers (ACSSC), January 2025.
    BibTeX TR2025-009 PDF
    • @inproceedings{Lohit2025jan,
    • author = {Lohit, Suhas and Marks, Tim K.},
    • title = {{Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images}},
    • booktitle = {Asilomar Conference on Signals, Systems, and Computers (ACSSC)},
    • year = 2025,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2025-009}
    • }
  •  He, Y., Shin, S., Cherian, A., Trigoni, N., Markham, A., "SoundLoc3D: Invisible 3D Sound Source Localization and Classification Using a Multimodal RGB-D Acoustic Camera", IEEE Winter Conference on Applications of Computer Vision (WACV), December 2024.
    BibTeX TR2025-003 PDF
    • @inproceedings{He2024dec2,
    • author = {He, Yuhang and Shin, Sangyun and Cherian, Anoop and Trigoni, Niki and Markham, Andrew},
    • title = {{SoundLoc3D: Invisible 3D Sound Source Localization and Classification Using a Multimodal RGB-D Acoustic Camera}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-003}
    • }
  •  Zhang, J., Zhang, F., Rodriguez, C., Ben-Shabat, I., Cherian, A., Gould, S., "Temporally Grounding Instructional Diagrams in Unconstrained Videos", IEEE Winter Conference on Applications of Computer Vision (WACV), December 2024.
    BibTeX TR2025-002 PDF
    • @inproceedings{Zhang2024dec,
    • author = {Zhang, Jiahao and Zhang, Frederic and Rodriguez, Cristian and Ben-Shabat, Itzik and Cherian, Anoop and Gould, Stephen},
    • title = {{Temporally Grounding Instructional Diagrams in Unconstrained Videos}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-002}
    • }
  •  Bimbraw, K., Wang, Y., Liu, J., Koike-Akino, T., "GPT Sonograpy: Hand Gesture Decoding from Forearm Ultrasound Images via VLM", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-175 PDF Presentation
    • @inproceedings{Bimbraw2024dec,
    • author = {Bimbraw, Keshav and Wang, Ye and Liu, Jing and Koike-Akino, Toshiaki},
    • title = {{GPT Sonograpy: Hand Gesture Decoding from Forearm Ultrasound Images via VLM}},
    • booktitle = {Advancements In Medical Foundation Models: Explainability, Robustness, Security, and Beyond Workshop at Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-175}
    • }
  •  Chen, X., Wang, Y., Brand, M., Wang, P., Liu, J., Koike-Akino, T., "Slaying the HyDRA: Parameter-Efficient Hyper Networks with Low-Displacement Rank Adaptation", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-157 PDF Presentation
    • @inproceedings{Chen2024dec,
    • author = {Chen, Xiangyu and Wang, Ye and Brand, Matthew and Wang, Pu and Liu, Jing and Koike-Akino, Toshiaki},
    • title = {{Slaying the HyDRA: Parameter-Efficient Hyper Networks with Low-Displacement Rank Adaptation}},
    • booktitle = {Workshop on Adaptive Foundation Models: Evolving AI for Personalized and Efficient Learning at Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-157}
    • }
  •  Fujihashi, T., Kato, S., Koike-Akino, T., "FV-NeRV: Neural Compression for Free Viewpoint Videos", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-176 PDF
    • @inproceedings{Fujihashi2024dec,
    • author = {Fujihashi, Takuya and Kato, Sorachi and Koike-Akino, Toshiaki},
    • title = {{FV-NeRV: Neural Compression for Free Viewpoint Videos}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-176}
    • }
  •  Park, Y.-J., Germain, F.G., Liu, J., Wang, Y., Koike-Akino, T., Wichern, G., Azizan, N., Laughman, C.R., Chakrabarty, A., "Probabilistic Forecasting for Building Energy Systems: Are Time-Series Foundation Models The Answer?", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2025-001 PDF
    • @inproceedings{Park2024dec,
    • author = {Park, Young-Jin and Germain, François G and Liu, Jing and Wang, Ye and Koike-Akino, Toshiaki and Wichern, Gordon and Azizan, Navid and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {{Probabilistic Forecasting for Building Energy Systems: Are Time-Series Foundation Models The Answer?}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2025-001}
    • }
  •  Tang, W.-T., Chakrabarty, A., Paulson, J.A., "TR-BEACON: Shedding Light on Efficient Behavior Discovery in High-Dimensional Spaces with Bayesian Novelty Search over Trust Regions", Advances in Neural Information Processing Systems (NeurIPS), December 2024.
    BibTeX TR2024-167 PDF
    • @inproceedings{Tang2024dec,
    • author = {Tang, Wei-Ting and Chakrabarty, Ankush and Paulson, Joel A.},
    • title = {{TR-BEACON: Shedding Light on Efficient Behavior Discovery in High-Dimensional Spaces with Bayesian Novelty Search over Trust Regions}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-167}
    • }
  •  Liu, J., Wang, Y., Koike-Akino, T., Nakai, T., Oonishi, K., Higashi, T., "MEL-PETs Defense for the NeurIPS 2024 LLM Privacy Challenge Blue Team Track", LLM Privacy Challenge at Neural Information Processing Systems (NeurIPS) 2024, December 2024.
    BibTeX TR2024-166 PDF Video Presentation
    • @inproceedings{Liu2024dec,
    • author = {Liu, Jing and Wang, Ye and Koike-Akino, Toshiaki and Nakai, Tsunato and Oonishi, Kento and Higashi, Takuya},
    • title = {{MEL-PETs Defense for the NeurIPS 2024 LLM Privacy Challenge Blue Team Track}},
    • booktitle = {LLM Privacy Challenge at Neural Information Processing Systems (NeurIPS) 2024},
    • year = 2024,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2024-166}
    • }