Publications

3,799 major publications by members of the MERL staff.


  •  Das, A., Rahman, S., Xiang, X., Palash, R.H., Hossain, T., Sikder, B., Yagyu, E., Nakamura, M., Teo, K.H., Chowdhury, N., "Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate", Advanced Theory and Simulations, March 2025.
    BibTeX TR2025-040 PDF
    • @article{Das2025mar,
    •   author  = {Das, Aurick and Rahman, Saimur and Xiang, Xiaofeng and Palash, Raffd Hassan and Hossain, Toiyob and Sikder, Bejoy and Yagyu, Eiji and Nakamura, Marika and Teo, Koon Hoo and Chowdhury, Nadim},
    •   title   = {{Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate}},
    •   journal = {Advanced Theory and Simulations},
    •   year    = {2025},
    •   month   = mar,
    •   url     = {https://www.merl.com/publications/TR2025-040},
    • }
  •  Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
    BibTeX TR2025-039 PDF
    • @inproceedings{Ranade2025mar,
    •   author    = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
    •   title     = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
    •   booktitle = {International Conference on 3D Vision (3DV)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-039},
    • }
  •  Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar,
    •   author        = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
    •   title         = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
    •   journal       = {arXiv},
    •   year          = {2025},
    •   month         = mar,
    •   eprint        = {2503.17269},
    •   archivePrefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2503.17269},
    • }
  •  Shenoy, V., Wu, S., Comas, A., Marks, T.K., Lohit, S., Mansour, H., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar2,
    •   author        = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Marks, Tim K. and Lohit, Suhas and Mansour, Hassan},
    •   title         = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    •   journal       = {arXiv},
    •   year          = {2025},
    •   month         = mar,
    •   eprint        = {2503.17351},
    •   archivePrefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2503.17351},
    • }
  •  Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", arXiv, March 2025.
    BibTeX arXiv
    • @article{Wilkinghoff2025mar2,
    •   author        = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
    •   title         = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
    •   journal       = {arXiv},
    •   year          = {2025},
    •   month         = mar,
    •   eprint        = {2503.10435},
    •   archivePrefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2503.10435},
    • }
  •  Shirai, Y., Raghunathan, A., Jha, D.K., "Hierarchical Contact-Rich Trajectory Optimization for Multi-Modal Manipulation using Tight Convex Relaxations", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shirai2025mar,
    •   author        = {Shirai, Yuki and Raghunathan, Arvind and Jha, Devesh K.},
    •   title         = {{Hierarchical Contact-Rich Trajectory Optimization for Multi-Modal Manipulation using Tight Convex Relaxations}},
    •   journal       = {arXiv},
    •   year          = {2025},
    •   month         = mar,
    •   eprint        = {2503.07963},
    •   archivePrefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2503.07963},
    • }
  •  Schperberg, A., Menner, M., Di Cairano, S., "Energy-Efficient Motion Planner for Legged Robots", arXiv, March 2025.
    BibTeX arXiv
    • @article{Schperberg2025mar,
    •   author        = {Schperberg, Alexander and Menner, Marcel and {Di Cairano}, Stefano},
    •   title         = {{Energy-Efficient Motion Planner for Legged Robots}},
    •   journal       = {arXiv},
    •   year          = {2025},
    •   month         = mar,
    •   eprint        = {2503.06050},
    •   archivePrefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2503.06050},
    • }
  •  Araki, S., Ito, N., Haeb-Umbach, R., Wichern, G., Wang, Z.-Q., Mitsufuji, Y., "30+ Years of Source Separation Research: Achievements and Future Challenges", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-036 PDF
    • @inproceedings{Araki2025mar,
    •   author    = {Araki, Shoko and Ito, Nobutaka and Haeb-Umbach, Reinhold and Wichern, Gordon and Wang, Zhong-Qiu and Mitsufuji, Yuki},
    •   title     = {{30+ Years of Source Separation Research: Achievements and Future Challenges}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-036},
    • }
  •  Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-037 PDF
    • @inproceedings{Ebbers2025mar,
    •   author    = {Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
    •   title     = {{No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-037},
    • }
  •  Gruttadauria, E., Fontaine, M., Le Roux, J., Essid, S., "O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-031 PDF
    • @inproceedings{Gruttadauria2025mar,
    •   author    = {Gruttadauria, Elio and Fontaine, Mathieu and {Le Roux}, Jonathan and Essid, Slim},
    •   title     = {{O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-031},
    • }
  •  Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-034 PDF
    • @inproceedings{Hori2025mar,
    •   author    = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    •   title     = {{Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-034},
    • }
  •  Kitichotkul, R., Rapp, J., Ma, Y., Mansour, H., "Doppler Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-028 PDF
    • @inproceedings{Kitichotkul2025mar,
    •   author    = {Kitichotkul, Ruangrawee and Rapp, Joshua and Ma, Yanting and Mansour, Hassan},
    •   title     = {{Doppler Single-Photon Lidar}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-028},
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-029 PDF Software
    • @inproceedings{Masuyama2025mar,
    •   author    = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Ick, Christopher and {Le Roux}, Jonathan},
    •   title     = {{Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-029},
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-033 PDF
    • @inproceedings{Saijo2025mar2,
    •   author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
    •   title     = {{Leveraging Audio-Only Data for Text-Queried Target Sound Extraction}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-033},
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-032 PDF
    • @inproceedings{Saijo2025mar,
    •   author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
    •   title     = {{Task-Aware Unified Source Separation}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-032},
    • }
  •  Teh, A., Ali, W.H., Rapp, J., Mansour, H., "Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-035 PDF
    • @inproceedings{Teh2025mar,
    •   author    = {Teh, Arjun and Ali, Wael H. and Rapp, Joshua and Mansour, Hassan},
    •   title     = {{Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-035},
    • }
  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Keeping the Balance: Anomaly Score Calculation for Domain Generalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-030 PDF
    • @inproceedings{Wilkinghoff2025mar,
    •   author    = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
    •   title     = {{Keeping the Balance: Anomaly Score Calculation for Domain Generalization}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-030},
    • }
  •  Tian, J., Shi, J., Chen, W., Arora, S., Masuyama, Y., Takashi, M., Wu, Y., Peng, J., Bharadwaj, S., Zhao, Y., Cornell, S., Peng, Y., Yue, X., Yang, C.-H.H., Neubig, G., Watanabe, S., "ESPnet-SpeechLM: An Open Speech Language Model Toolkit", NAACL-HLT (the system demonstration track), March 2025.
    BibTeX TR2025-038 PDF
    • @inproceedings{Tian2025mar,
    •   author    = {Tian, Jinchuan and Shi, Jiatong and Chen, William and Arora, Siddhant and Masuyama, Yoshiki and Takashi, Maekaku and Wu, Yihan and Peng, Junyi and Bharadwaj, Shikhar and Zhao, Yiwen and Cornell, Samuele and Peng, Yifan and Yue, Xiang and Yang, Chao-Han H. and Neubig, Graham and Watanabe, Shinji},
    •   title     = {{ESPnet-SpeechLM: An Open Speech Language Model Toolkit}},
    •   booktitle = {NAACL-HLT (the system demonstration track)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-038},
    • }
  •  Koike-Akino, T., Tonin, F., Wu, Y., Wu, F.Z., Candogan, L.N., Cevher, V., "Quantum-PEFT: Ultra parameter-efficient fine-tuning", arXiv, March 2025.
    BibTeX arXiv
    • @article{Koike-Akino2025mar,
    •   author        = {Koike-Akino, Toshiaki and Tonin, Francesco and Wu, Yongtao and Wu, Frank Zhengqing and Candogan, Leyla Naz and Cevher, Volkan},
    •   title         = {{Quantum-PEFT: Ultra parameter-efficient fine-tuning}},
    •   journal       = {arXiv},
    •   year          = {2025},
    •   month         = mar,
    •   eprint        = {2503.05431},
    •   archivePrefix = {arXiv},
    •   url           = {https://arxiv.org/abs/2503.05431},
    • }
  •  Attiah, K., Wang, P., Mansour, H., Koike-Akino, T., Boufounos, P.T., "Enabling DMG Wi-Fi Sensing in Data Transmission Intervals by Exploiting Beam Training Codebook", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-026 PDF
    • @inproceedings{Attiah2025mar,
    •   author    = {Attiah, Kareem and Wang, Pu and Mansour, Hassan and Koike-Akino, Toshiaki and Boufounos, Petros T.},
    •   title     = {{Enabling DMG Wi-Fi Sensing in Data Transmission Intervals by Exploiting Beam Training Codebook}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-026},
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Multi-View Radar Detection Transformer with Differentiable Positional Encoding", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-027 PDF
    • @inproceedings{Yataka2025mar,
    •   author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    •   title     = {{Multi-View Radar Detection Transformer with Differentiable Positional Encoding}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-027},
    • }
  •  Wang, R., Wang, Y., Liu, J., Koike-Akino, T., "Quantum Diffusion Models for Few-Shot Learning", AAAI Conference on Artificial Intelligence, March 2025.
    BibTeX TR2025-025 PDF
    • @inproceedings{Wang2025mar,
    •   author    = {Wang, Ruhan and Wang, Ye and Liu, Jing and Koike-Akino, Toshiaki},
    •   title     = {{Quantum Diffusion Models for Few-Shot Learning}},
    •   booktitle = {AAAI Conference on Artificial Intelligence},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-025},
    • }
  •  Fujihashi, T., Koike-Akino, T., "Quantum Implicit Neural Compression", AAAI Conference on Artificial Intelligence, March 2025.
    BibTeX TR2025-024 PDF
    • @inproceedings{Fujihashi2025mar,
    •   author    = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
    •   title     = {{Quantum Implicit Neural Compression}},
    •   booktitle = {AAAI Conference on Artificial Intelligence},
    •   year      = {2025},
    •   month     = mar,
    •   url       = {https://www.merl.com/publications/TR2025-024},
    • }
  •  Vinod, A.P., Weiss, A., Di Cairano, S., "Projection-free computation of robust controllable sets with constrained zonotopes", Automatica, DOI: 10.1016/j.automatica.2025.112211, Vol. 175, pp. 112211, March 2025.
    BibTeX TR2025-023 PDF Video
    • @article{Vinod2025mar,
    •   author  = {Vinod, Abraham P. and Weiss, Avishai and {Di Cairano}, Stefano},
    •   title   = {{Projection-free computation of robust controllable sets with constrained zonotopes}},
    •   journal = {Automatica},
    •   year    = {2025},
    •   volume  = {175},
    •   pages   = {112211},
    •   month   = mar,
    •   doi     = {10.1016/j.automatica.2025.112211},
    •   issn    = {0005-1098},
    •   url     = {https://www.merl.com/publications/TR2025-023},
    • }
  •  Shao, K., Chakrabarty, A., Mesbah, A., Romeres, D., "Coactive Preference-Guided Multi-Objective Bayesian Optimization: An Application to Policy Learning in Personalized Plasma Medicine", IEEE Control Systems Letters, February 2025.
    BibTeX TR2025-021 PDF
    • @article{Shao2025feb,
    •   author  = {Shao, Ketong and Chakrabarty, Ankush and Mesbah, Ali and Romeres, Diego},
    •   title   = {{Coactive Preference-Guided Multi-Objective Bayesian Optimization: An Application to Policy Learning in Personalized Plasma Medicine}},
    •   journal = {IEEE Control Systems Letters},
    •   year    = {2025},
    •   month   = feb,
    •   url     = {https://www.merl.com/publications/TR2025-021},
    • }