- Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers", arXiv, April 2024.
BibTeX arXiv- @article{Koo2024apr2,
- author = {Koo, Junghyun and Wichern, Gordon and Germain, François G. and Khurana, Sameer and {Le Roux}, Jonathan},
- title = {{SMITIN: Self-Monitored Inference-Time INtervention for Generative Music Transformers}},
- journal = {arXiv},
- year = 2024,
- month = apr,
- eprint = {2404.02252},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2404.02252}
- }
- Koo, J., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), April 2024.
BibTeX TR2024-032 PDF- @inproceedings{Koo2024apr,
- author = {Koo, Junghyun and Wichern, Gordon and Germain, François G. and Khurana, Sameer and {Le Roux}, Jonathan},
- title = {{Understanding and Controlling Generative Music Transformers by Probing Individual Attention Heads}},
- booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
- year = 2024,
- month = apr,
- url = {https://www.merl.com/publications/TR2024-032}
- }
- Zhang, Z., Lin, C., Wang, B., "Physics-informed shape optimization using coordinate projection", Scientific Reports, DOI: 10.1038/s41598-024-57137-4, Vol. 14, pp. 6537, April 2024.
BibTeX TR2024-035 PDF- @article{Zhang2024apr,
- author  = {Zhang, Zhizhou and Lin, Chungwei and Wang, Bingnan},
- title   = {{Physics-informed shape optimization using coordinate projection}},
- journal = {Scientific Reports},
- volume  = {14},
- pages   = {6537},
- month   = apr,
- year    = {2024},
- doi     = {10.1038/s41598-024-57137-4},
- url     = {https://www.merl.com/publications/TR2024-035}
- }
- Zhu, X., Jha, D.K., Romeres, D., Sun, L., Tomizuka, M., Cherian, A., "Multi-level Reasoning for Robotic Assembly: From Sequence Inference to Contact Selection", IEEE International Conference on Robotics and Automation (ICRA), March 2024, pp. 816-823.
BibTeX TR2024-033 PDF Video- @inproceedings{Zhu2024mar,
- author    = {Zhu, Xinghao and Jha, Devesh K. and Romeres, Diego and Sun, Lingfeng and Tomizuka, Masayoshi and Cherian, Anoop},
- title     = {{Multi-level Reasoning for Robotic Assembly: From Sequence Inference to Contact Selection}},
- booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
- publisher = {IEEE},
- pages     = {816--823},
- month     = mar,
- year      = {2024},
- url       = {https://www.merl.com/publications/TR2024-033}
- }
- Wang, Y., Hansen, E., Ahn, H., "Hierarchical planning for autonomous parking in dynamic environments", IEEE Transactions on Control Systems Technology, DOI: 10.1109/TCST.2024.3367468, March 2024.
BibTeX TR2024-034 PDF- @article{Wang2024mar2,
- author  = {Wang, Yebin and Hansen, Emma and Ahn, Heejin},
- title   = {{Hierarchical planning for autonomous parking in dynamic environments}},
- journal = {IEEE Transactions on Control Systems Technology},
- month   = mar,
- year    = {2024},
- issn    = {1558-0865},
- doi     = {10.1109/TCST.2024.3367468},
- url     = {https://www.merl.com/publications/TR2024-034}
- }
- Gaur, A., Pais, G., Miraldo, P., "Oriented-grid Encoder for 3D Implicit Representations", International Conference on 3D Vision (3DV), DOI: 10.1109/3DV62453.2024.00101, March 2024, pp. 1208-1218.
BibTeX TR2024-031 PDF- @inproceedings{Gaur2024mar,
- author    = {Gaur, Arihant and Pais, Goncalo and Miraldo, Pedro},
- title     = {{Oriented-grid Encoder for 3D Implicit Representations}},
- booktitle = {International Conference on 3D Vision (3DV)},
- publisher = {IEEE},
- pages     = {1208--1218},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/3DV62453.2024.00101},
- isbn      = {979-8-3503-6245-9},
- issn      = {2475-7888},
- url       = {https://www.merl.com/publications/TR2024-031}
- }
- Chen, X., Liu, J., Wang, Y., Wang, P., Brand, M., Wang, G., Koike-Akino, T., "SuperLoRA: Parameter-Efficient Unified Adaptation of Multi-Layer Attention Modules", arXiv, March 2024.
BibTeX arXiv- @article{Chen2024mar,
- author = {Chen, Xiangyu and Liu, Jing and Wang, Ye and Wang, Pu and Brand, Matthew and Wang, Guanghui and Koike-Akino, Toshiaki},
- title = {{SuperLoRA: Parameter-Efficient Unified Adaptation of Multi-Layer Attention Modules}},
- journal = {arXiv},
- year = 2024,
- month = mar,
- eprint = {2403.11887},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2403.11887}
- }
- Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Why does music source separation benefit from cacophony?", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), DOI: 10.1109/ICASSPW62465.2024.10669899, March 2024, pp. 873-877.
BibTeX TR2024-030 PDF Video- @inproceedings{Jeon2024mar,
- author = {Jeon, Chang-Bin and Wichern, Gordon and Germain, François G. and {Le Roux}, Jonathan},
- title = {{Why does music source separation benefit from cacophony?}},
- booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
- year = 2024,
- pages = {873--877},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSPW62465.2024.10669899},
- isbn = {979-8-3503-7451-3},
- url = {https://www.merl.com/publications/TR2024-030}
- }
- Bralios, D., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "Generation or Replication: Auscultating Audio Latent Diffusion Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447705, March 2024, pp. 1156-1160.
BibTeX TR2024-027 PDF- @inproceedings{Bralios2024mar,
- author = {Bralios, Dimitrios and Wichern, Gordon and Germain, François G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and {Le Roux}, Jonathan},
- title = {{Generation or Replication: Auscultating Audio Latent Diffusion Models}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {1156--1160},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10447705},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-027}
- }
- Fernandez-Menduina, S., Rapp, J., Mansour, H., Greiff, M., Parsons, K., "Tracking Beyond the Unambiguous Range with Modulo Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446835, March 2024, pp. 6-10.
BibTeX TR2024-021 PDF- @inproceedings{Fernandez-Menduina2024mar,
- author = {Fernandez-Menduina, Samuel and Rapp, Joshua and Mansour, Hassan and Greiff, Marcus and Parsons, Kieran},
- title = {{Tracking Beyond the Unambiguous Range with Modulo Single-Photon Lidar}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {6--10},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10446835},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-021}
- }
- Masuyama, Y., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "NIIRF: Neural IIR Filter Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10448477, March 2024, pp. 1016-1020.
BibTeX TR2024-026 PDF Software- @inproceedings{Masuyama2024mar,
- author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G. and Pan, Zexu and Khurana, Sameer and Hori, Chiori and {Le Roux}, Jonathan},
- title = {{NIIRF: Neural IIR Filter Field for HRTF Upsampling and Personalization}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {1016--1020},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10448477},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-026}
- }
- Pan, Z., Wichern, G., Germain, F.G., Khurana, S., Le Roux, J., "NeuroHeed+: Improving Neuro-steered Speaker Extraction with Joint Auditory Attention Detection", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446333, March 2024, pp. 11456-11460.
BibTeX TR2024-025 PDF- @inproceedings{Pan2024mar,
- author = {Pan, Zexu and Wichern, Gordon and Germain, François G. and Khurana, Sameer and {Le Roux}, Jonathan},
- title = {{NeuroHeed+: Improving Neuro-steered Speaker Extraction with Joint Auditory Attention Detection}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {11456--11460},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10446333},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-025}
- }
- Sholokhov, A., Rapp, J., Nabi, S., Brunton, S., Kutz, N., Mansour, H., "Single-pixel imaging of dynamic flows using Neural ODE regularization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447584, March 2024, pp. 2530-2534.
BibTeX TR2024-024 PDF- @inproceedings{Sholokhov2024mar,
- author = {Sholokhov, Aleksei and Rapp, Joshua and Nabi, Saleh and Brunton, Steven and Kutz, Nathan and Mansour, Hassan},
- title = {{Single-pixel imaging of dynamic flows using Neural ODE regularization}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {2530--2534},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10447584},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-024}
- }
- Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F.G., Le Roux, J., Watanabe, S., "Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447215, March 2024, pp. 316-320.
BibTeX TR2024-028 PDF- @inproceedings{Wu2024mar,
- author = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, François G. and {Le Roux}, Jonathan and Watanabe, Shinji},
- title = {{Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {316--320},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10447215},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-028}
- }
- Kato, S., Wang, P., Koike-Akino, T., Fujihashi, T., Mansour, H., Boufounos, P.T., "Object Trajectory Estimation with Multi-Band Wi-Fi Neural Dynamic Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10445972, March 2024, pp. 13261-13265.
BibTeX TR2024-019 PDF- @inproceedings{Kato2024mar,
- author    = {Kato, Sorachi and Wang, Pu and Koike-Akino, Toshiaki and Fujihashi, Takuya and Mansour, Hassan and Boufounos, Petros T.},
- title     = {{Object Trajectory Estimation with Multi-Band Wi-Fi Neural Dynamic Fusion}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- publisher = {IEEE},
- pages     = {13261--13265},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/ICASSP48485.2024.10445972},
- isbn      = {979-8-3503-4485-1},
- issn      = {2379-190X},
- url       = {https://www.merl.com/publications/TR2024-019}
- }
- Wang, P., Boufounos, P.T., "Monostatic DMG Passive Sensing with Hypothesis Testing", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447134, March 2024, pp. 13381-13385.
BibTeX TR2024-020 PDF- @inproceedings{Wang2024mar,
- author    = {Wang, Pu and Boufounos, Petros T.},
- title     = {{Monostatic DMG Passive Sensing with Hypothesis Testing}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- publisher = {IEEE},
- pages     = {13381--13385},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/ICASSP48485.2024.10447134},
- isbn      = {979-8-3503-4485-1},
- issn      = {2379-190X},
- url       = {https://www.merl.com/publications/TR2024-020}
- }
- Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar Perception with Scalable Connective Temporal Relations for Autonomous Driving", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446449, March 2024, pp. 13266-13270.
BibTeX TR2024-023 PDF- @inproceedings{Yataka2024mar,
- author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
- title     = {{Radar Perception with Scalable Connective Temporal Relations for Autonomous Driving}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- publisher = {IEEE},
- pages     = {13266--13270},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/ICASSP48485.2024.10446449},
- isbn      = {979-8-3503-4485-1},
- issn      = {2379-190X},
- url       = {https://www.merl.com/publications/TR2024-023}
- }
- Kobori, H., Fukuchi, K., Wang, Y., "Evaluation of Information Security Risk from Training Data Inference in Federated Learning", The Institute of Electronics, Information and Communication Engineers, General Conference, March 2024.
BibTeX - @inproceedings{Kobori2024mar,
- author    = {Kobori, Hiroko and Fukuchi, Ken and Wang, Ye},
- title     = {{Evaluation of Information Security Risk from Training Data Inference in Federated Learning}},
- booktitle = {The Institute of Electronics, Information and Communication Engineers, General Conference},
- month     = mar,
- year      = {2024}
- }
- Fujihashi, T., Koike-Akino, T., "Graph-Based EEG Signal Compression for Human-Machine Interaction", IEEE Access, DOI: 10.1109/ACCESS.2023.3347592, Vol. 12, pp. 1163-1171, March 2024.
BibTeX TR2024-015 PDF- @article{Fujihashi2024mar,
- author = {Fujihashi, Takuya and Koike-Akino, Toshiaki},
- title = {{Graph-Based EEG Signal Compression for Human-Machine Interaction}},
- journal = {IEEE Access},
- year = 2024,
- volume = 12,
- pages = {1163--1171},
- month = mar,
- doi = {10.1109/ACCESS.2023.3347592},
- issn = {2169-3536},
- url = {https://www.merl.com/publications/TR2024-015}
- }
- Baoueb, T., Liu, H., Fontaine, M., Le Roux, J., Richard, G., "SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446830, March 2024, pp. 986-990.
BibTeX TR2024-013 PDF- @inproceedings{Baoueb2024mar,
- author = {Baoueb, Teysir and Liu, Haocheng and Fontaine, Mathieu and {Le Roux}, Jonathan and Richard, Gaël},
- title = {{SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {986--990},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10446830},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-013}
- }
- Hori, C., Wang, P., Rahman, M., Vaca-Rubio, C., Khurana, S., Cherian, A., Le Roux, J., "Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447600, March 2024, pp. 13296-13300.
BibTeX TR2024-012 PDF- @inproceedings{Hori2024mar,
- author    = {Hori, Chiori and Wang, Pu and Rahman, Mahbub and Vaca-Rubio, Cristian and Khurana, Sameer and Cherian, Anoop and {Le Roux}, Jonathan},
- title     = {{Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- publisher = {IEEE},
- pages     = {13296--13300},
- month     = mar,
- year      = {2024},
- doi       = {10.1109/ICASSP48485.2024.10447600},
- isbn      = {979-8-3503-4485-1},
- issn      = {2379-190X},
- url       = {https://www.merl.com/publications/TR2024-012}
- }
- Liu, H., Baoueb, T., Fontaine, M., Le Roux, J., Richard, G., "GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446058, March 2024, pp. 11611-11615.
BibTeX TR2024-014 PDF- @inproceedings{Liu2024mar,
- author = {Liu, Haocheng and Baoueb, Teysir and Fontaine, Mathieu and {Le Roux}, Jonathan and Richard, Gaël},
- title = {{GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2024,
- pages = {11611--11615},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/ICASSP48485.2024.10446058},
- issn = {2379-190X},
- isbn = {979-8-3503-4485-1},
- url = {https://www.merl.com/publications/TR2024-014}
- }
- Zhang, X., Mowlavi, S., Benosman, M., Basar, T., "Policy Optimization for PDE Control with a Warm Start", arXiv, March 2024.
BibTeX arXiv- @article{Zhang2024mar,
- author = {Zhang, Xiangyuan and Mowlavi, Saviz and Benosman, Mouhacine and Basar, Tamer},
- title = {{Policy Optimization for PDE Control with a Warm Start}},
- journal = {arXiv},
- year = 2024,
- month = mar,
- eprint = {2403.01005},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/2403.01005}
- }
- Hossain, T., Sikder, B., Azad, M.T., Xie, Q., Yuan, M., Yagyu, E., Teo, K.H., Palacios, T., Chowdhury, N., "Fermi-Level Pinning Effect in Gate Region: A Case Study of Multi-Metal Gated AlGaN/GaN HEMT for High RF Linearity", IEEE Electron Devices Technology & Manufacturing Conference, DOI: 10.1109/EDTM58488.2024.10512349, February 2024.
BibTeX TR2024-010 PDF- @inproceedings{Hossain2024feb,
- author = {Hossain, Toiyob and Sikder, Bejoy and Azad, Md. Tasnim and Xie, Qingyun and Yuan, Mengyang and Yagyu, Eiji and Teo, Koon Hoo and Palacios, Tomas and Chowdhury, Nadim},
- title = {{Fermi-Level Pinning Effect in Gate Region: A Case Study of Multi-Metal Gated AlGaN/GaN HEMT for High RF Linearity}},
- booktitle = {IEEE Electron Devices Technology \& Manufacturing Conference},
- year = 2024,
- month = feb,
- doi = {10.1109/EDTM58488.2024.10512349},
- url = {https://www.merl.com/publications/TR2024-010}
- }
- Bortoff, S.A., Eisenhower, B., Adetola, V., O'Neil, Z., "Control Challenges and Opportunities in Building Automation" in The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future, February 2024.
BibTeX TR2024-011 PDF- @incollection{Bortoff2024feb,
- author    = {Bortoff, Scott A. and Eisenhower, Bryan and Adetola, Veronica and O'Neil, Zheng},
- title     = {{Control Challenges and Opportunities in Building Automation}},
- booktitle = {The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future},
- month     = feb,
- year      = {2024},
- url       = {https://www.merl.com/publications/TR2024-011}
- }