Publications

588 / 3,737 publications found.


  •  Chang, X., Moritz, N., Hori, T., Watanabe, S., Le Roux, J., "Extended Graph Temporal Classification for Multi-Speaker End-to-End ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9747375, April 2022, pp. 7322-7326.
    BibTeX TR2022-021 PDF
    • @inproceedings{Chang2022apr,
    • author = {Chang, Xuankai and Moritz, Niko and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {Extended Graph Temporal Classification for Multi-Speaker End-to-End ASR},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {7322--7326},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9747375},
    • url = {https://www.merl.com/publications/TR2022-021}
    • }
  •  Higuchi, Y., Moritz, N., Le Roux, J., Hori, T., "Advancing Momentum Pseudo-Labeling with Conformer and Initialization Strategy", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9746275, April 2022, pp. 7672-7676.
    BibTeX TR2022-026 PDF
    • @inproceedings{Higuchi2022apr,
    • author = {Higuchi, Yosuke and Moritz, Niko and Le Roux, Jonathan and Hori, Takaaki},
    • title = {Advancing Momentum Pseudo-Labeling with Conformer and Initialization Strategy},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {7672--7676},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9746275},
    • url = {https://www.merl.com/publications/TR2022-026}
    • }
  •  Moritz, N., Hori, T., Watanabe, S., Le Roux, J., "Sequence Transduction with Graph-based Supervision", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9747788, April 2022, pp. 7212-7216.
    BibTeX TR2022-024 PDF
    • @inproceedings{Moritz2022apr,
    • author = {Moritz, Niko and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {Sequence Transduction with Graph-based Supervision},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {7212--7216},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9747788},
    • url = {https://www.merl.com/publications/TR2022-024}
    • }
  •  Peng, K.-C., "Iterative Self Knowledge Distillation -- From Pothole Classification To Fine-Grained And COVID Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), Gan, W.-S. and Ma, K. K., Eds., DOI: 10.1109/​ICASSP43922.2022.9746470, April 2022, pp. 3139-3143.
    BibTeX TR2022-020 PDF Video Presentation
    • @inproceedings{Peng2022apr,
    • author = {Peng, Kuan-Chuan},
    • title = {Iterative Self Knowledge Distillation -- From Pothole Classification To Fine-Grained And COVID Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • editor = {Gan, W.-S. and Ma, K. K.},
    • pages = {3139--3143},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9746470},
    • issn = {1520-6149},
    • isbn = {978-1-6654-0541-6},
    • url = {https://www.merl.com/publications/TR2022-020}
    • }
  •  Petermann, D., Wichern, G., Wang, Z.-Q., Le Roux, J., "The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9746005, April 2022, pp. 526-530.
    BibTeX TR2022-022 PDF Video Software
    • @inproceedings{Petermann2022apr,
    • author = {Petermann, Darius and Wichern, Gordon and Wang, Zhong-Qiu and Le Roux, Jonathan},
    • title = {The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {526--530},
    • month = apr,
    • doi = {10.1109/ICASSP43922.2022.9746005},
    • url = {https://www.merl.com/publications/TR2022-022}
    • }
  •  Slizovskaia, O., Wichern, G., Wang, Z.-Q., Le Roux, J., "Locate This, Not That: Class-Conditioned Sound Event DOA Estimation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9747604, April 2022, pp. 711-715.
    BibTeX TR2022-023 PDF
    • @inproceedings{Slizovskaia2022mar,
    • author = {Slizovskaia, Olga and Wichern, Gordon and Wang, Zhong-Qiu and Le Roux, Jonathan},
    • title = {Locate This, Not That: Class-Conditioned Sound Event DOA Estimation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • pages = {711--715},
    • month = apr,
    • doi = {10.1109/ICASSP43922.2022.9747604},
    • url = {https://www.merl.com/publications/TR2022-023}
    • }
  •  Yu, J., Wang, P., Koike-Akino, T., Orlik, P.V., "Multi-Modal Recurrent Fusion for Indoor Localization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9746071, April 2022.
    BibTeX TR2022-018 PDF
    • @inproceedings{Yu2022apr,
    • author = {Yu, Jianyuan and Wang, Pu and Koike-Akino, Toshiaki and Orlik, Philip V.},
    • title = {Multi-Modal Recurrent Fusion for Indoor Localization},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2022,
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP43922.2022.9746071},
    • issn = {2379-190X},
    • isbn = {978-1-6654-0540-9},
    • url = {https://www.merl.com/publications/TR2022-018}
    • }
  •  Cauligi, A., Chakrabarty, A., Di Cairano, S., Quirynen, R., "PRISM: Recurrent Neural Networks and Presolve Methods for Fast Mixed-integer Optimal Control", Learning for Dynamics and Control Conference (L4DC), April 2022, pp. 34-46.
    BibTeX TR2022-039 PDF
    • @inproceedings{Cauligi2022apr,
    • author = {Cauligi, Abhishek and Chakrabarty, Ankush and Di Cairano, Stefano and Quirynen, Rien},
    • title = {PRISM: Recurrent Neural Networks and Presolve Methods for Fast Mixed-integer Optimal Control},
    • booktitle = {Learning for Dynamics and Control Conference (L4DC)},
    • year = 2022,
    • pages = {34--46},
    • month = apr,
    • publisher = {Proceedings of Machine Learning Research (PMLR)},
    • url = {https://www.merl.com/publications/TR2022-039}
    • }
  •  Sanz-Alcaine, J.M., Sanz-Gorrachategui, I., Pajovic, M., Orlik, P.V., "Online Voltage Prediction Using Gaussian Process Regression for Fault-Tolerant Photovoltaic Standalone Applications", Neural Computing and Applications, DOI: 10.1007/​s00521-021-06254-6, Vol. 33, No. 23, pp. 16577–16590, March 2022.
    BibTeX TR2022-038 PDF
    • @article{Sanz-Alcaine2022mar,
    • author = {Sanz-Alcaine, José Miguel and Sanz-Gorrachategui, Ivan and Pajovic, Milutin and Orlik, Philip V.},
    • title = {Online Voltage Prediction Using Gaussian Process Regression for Fault-Tolerant Photovoltaic Standalone Applications},
    • journal = {Neural Computing and Applications},
    • year = 2022,
    • volume = 33,
    • number = 23,
    • pages = {16577--16590},
    • month = mar,
    • doi = {10.1007/s00521-021-06254-6},
    • url = {https://www.merl.com/publications/TR2022-038}
    • }
  •  Anantharaman, R., Abdelrahim, A., Martinuzzi, F., Yalburgi, S., Saba, E., Fischer, K., Hertz, G., de Vos, P., Laughman, C.R., Ma, Y., Shah, V., Edelman, A., Rackauckas, C., "Composable and Reusable Neural Surrogates to Predict System Response of Causal Model Components", AAAI 2022 Workshop on AI based Design and Manufacturing, March 2022.
    BibTeX TR2022-034 PDF
    • @inproceedings{Anantharaman2022mar,
    • author = {Anantharaman, Ranjan and Abdelrahim, Anas and Martinuzzi, Francesco and Yalburgi, Sharan and Saba, Elliot and Fischer, Keno and Hertz, Glen and de Vos, Pepijn and Laughman, Christopher R. and Ma, Yingbo and Shah, Viral and Edelman, Alan and Rackauckas, Chris},
    • title = {Composable and Reusable Neural Surrogates to Predict System Response of Causal Model Components},
    • booktitle = {AAAI 2022 Workshop on AI based Design and Manufacturing},
    • year = 2022,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2022-034}
    • }
  •  Chakrabarty, A., Maddalena, E., Qiao, H., Laughman, C.R., "Scalable Bayesian Optimization for Model Calibration: Case Study on Coupled Building and HVAC Dynamics", Energy and Buildings, DOI: 10.1016/​j.enbuild.2021.111460, Vol. 253, pp. 111460, March 2022.
    BibTeX TR2022-030 PDF
    • @article{Chakrabarty2022mar,
    • author = {Chakrabarty, Ankush and Maddalena, Emilio and Qiao, Hongtao and Laughman, Christopher R.},
    • title = {Scalable Bayesian Optimization for Model Calibration: Case Study on Coupled Building and HVAC Dynamics},
    • journal = {Energy and Buildings},
    • year = 2022,
    • volume = 253,
    • pages = 111460,
    • month = mar,
    • doi = {10.1016/j.enbuild.2021.111460},
    • url = {https://www.merl.com/publications/TR2022-030}
    • }
  •  Cao, W., Benosman, M., Zhang, X., Ma, R., "Domain Knowledge-Based Automated Analog Circuit Design with Deep Reinforcement Learning", AAAI Conference on Artificial Intelligence, February 2022.
    BibTeX TR2022-017 PDF
    • @inproceedings{Cao2022feb,
    • author = {Cao, Weidong and Benosman, Mouhacine and Zhang, Xuan and Ma, Rui},
    • title = {Domain Knowledge-Based Automated Analog Circuit Design with Deep Reinforcement Learning},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2022-017}
    • }
  •  Cherian, A., Hori, C., Marks, T.K., Le Roux, J., "(2.5+1)D Spatio-Temporal Scene Graphs for Video Question Answering", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v36i1.19922, February 2022, pp. 444-453.
    BibTeX TR2022-014 PDF Video Presentation
    • @inproceedings{Cherian2022feb,
    • author = {Cherian, Anoop and Hori, Chiori and Marks, Tim K. and Le Roux, Jonathan},
    • title = {(2.5+1)D Spatio-Temporal Scene Graphs for Video Question Answering},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {444--453},
    • month = feb,
    • doi = {10.1609/aaai.v36i1.19922},
    • url = {https://www.merl.com/publications/TR2022-014}
    • }
  •  Ke, L., Peng, K.-C., Lyu, S., "Towards To-a-T Spatio-Temporal Focus for Skeleton-Based Action Recognition", AAAI Conference on Artificial Intelligence, February 2022.
    BibTeX TR2022-015 PDF Presentation
    • @inproceedings{Ke2022feb,
    • author = {Ke, Lipeng and Peng, Kuan-Chuan and Lyu, Siwei},
    • title = {Towards To-a-T Spatio-Temporal Focus for Skeleton-Based Action Recognition},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2022-015}
    • }
  •  Shah, A., Sra, S., Chellappa, R., Cherian, A., "Max-Margin Contrastive Learning", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v36i8.20796, February 2022, pp. 8220-8230.
    BibTeX TR2022-013 PDF
    • @inproceedings{Shah2022feb,
    • author = {Shah, Anshul and Sra, Suvrit and Chellappa, Rama and Cherian, Anoop},
    • title = {Max-Margin Contrastive Learning},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {8220--8230},
    • month = feb,
    • doi = {10.1609/aaai.v36i8.20796},
    • url = {https://www.merl.com/publications/TR2022-013}
    • }
  •  Medin, S.C., Egger, B., Cherian, A., Wang, Y., Tenenbaum, J.B., Liu, X., Marks, T.K., "MOST-GAN: 3D Morphable StyleGAN for Disentangled Face Image Manipulation", AAAI Conference on Artificial Intelligence, DOI: 10.1609/​aaai.v36i2.20091, February 2022, pp. 1962-1971.
    BibTeX TR2022-011 PDF Video Data Presentation
    • @inproceedings{Medin2022feb,
    • author = {Medin, Safa C. and Egger, Bernhard and Cherian, Anoop and Wang, Ye and Tenenbaum, Joshua B. and Liu, Xiaoming and Marks, Tim K.},
    • title = {MOST-GAN: 3D Morphable StyleGAN for Disentangled Face Image Manipulation},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2022,
    • pages = {1962--1971},
    • month = feb,
    • doi = {10.1609/aaai.v36i2.20091},
    • url = {https://www.merl.com/publications/TR2022-011}
    • }
  •  Chakrabarty, A., Danielson, C., Bortoff, S.A., Laughman, C.R., "Accelerating self-optimization control of refrigerant cycles with Bayesian optimization and adaptive moment estimation", Applied Thermal Engineering, DOI: 10.1016/​j.applthermaleng.2021.117335, Vol. 197, pp. 117335, February 2022.
    BibTeX TR2022-010 PDF
    • @article{Chakrabarty2022feb,
    • author = {Chakrabarty, Ankush and Danielson, Claus and Bortoff, Scott A. and Laughman, Christopher R.},
    • title = {Accelerating self-optimization control of refrigerant cycles with Bayesian optimization and adaptive moment estimation},
    • journal = {Applied Thermal Engineering},
    • year = 2022,
    • volume = 197,
    • pages = 117335,
    • month = feb,
    • doi = {10.1016/j.applthermaleng.2021.117335},
    • url = {https://www.merl.com/publications/TR2022-010}
    • }
  •  De Silva, U., Ma, R., Koike-Akino, T., Yamashita, A., Nakamizo, H., "A Modular 1D-CNN Architecture for Real-time Digital Pre-distortion", IEEE Radio and Wireless Symposium (RWS), January 2022.
    BibTeX TR2022-007 PDF
    • @inproceedings{DeSilva2022jan,
    • author = {De Silva, Udara and Ma, Rui and Koike-Akino, Toshiaki and Yamashita, Ao and Nakamizo, Hideyuki},
    • title = {A Modular 1D-CNN Architecture for Real-time Digital Pre-distortion},
    • booktitle = {IEEE Radio and Wireless Symposium (RWS)},
    • year = 2022,
    • month = jan,
    • issn = {2473-4640},
    • isbn = {978-1-6654-3472-0},
    • url = {https://www.merl.com/publications/TR2022-007}
    • }
  •  Lohit, S., Jones, M.J., "Model Compression Using Optimal Transport", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2022.
    BibTeX TR2022-006 PDF Presentation
    • @inproceedings{Lohit2022jan,
    • author = {Lohit, Suhas and Jones, Michael J.},
    • title = {Model Compression Using Optimal Transport},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2022,
    • month = jan,
    • publisher = {CVF OpenAccess},
    • url = {https://www.merl.com/publications/TR2022-006}
    • }
  •  Jeon, W., Chakrabarty, A., Zemouche, A., Rajamani, R., "Simultaneous State Estimation and Tire Model Learning for Autonomous Vehicle Applications", IEEE/ASME Transactions on Mechatronics, DOI: 10.1109/​TMECH.2021.3081035, Vol. 26, No. 4, pp. 1941-1950, January 2022.
    BibTeX TR2022-003 PDF
    • @article{Jeon2022jan,
    • author = {Jeon, Woongsun and Chakrabarty, Ankush and Zemouche, Ali and Rajamani, Rajesh},
    • title = {Simultaneous State Estimation and Tire Model Learning for Autonomous Vehicle Applications},
    • journal = {IEEE/ASME Transactions on Mechatronics},
    • year = 2022,
    • volume = 26,
    • number = 4,
    • pages = {1941--1950},
    • month = jan,
    • doi = {10.1109/TMECH.2021.3081035},
    • url = {https://www.merl.com/publications/TR2022-003}
    • }
  •  Teo, K.H., Zhang, Y., Chowdhury, N., Rakheja, S., Ma, R., Xie, Q., Yagyu, E., Yamanaka, K., Li, K., Palacios, T., "Emerging GaN technologies for power, RF, digital and quantum computing applications: recent advances and prospects", Journal of Applied Physics, DOI: 10.1063/​5.0061555, December 2021.
    BibTeX TR2022-002 PDF
    • @article{Teo2021dec,
    • author = {Teo, Koon Hoo and Zhang, Yuhao and Chowdhury, Nadim and Rakheja, Shaloo and Ma, Rui and Xie, Qingyun and Yagyu, Eiji and Yamanaka, Koji and Li, Kexin and Palacios, Tomas},
    • title = {Emerging GaN technologies for power, RF, digital and quantum computing applications: recent advances and prospects},
    • journal = {Journal of Applied Physics},
    • year = 2021,
    • month = dec,
    • doi = {10.1063/5.0061555},
    • url = {https://www.merl.com/publications/TR2022-002}
    • }
  •  Zhan, S., Wichern, G., Laughman, C.R., Chakrabarty, A., "Meta-Learned Bayesian Optimization for Building Model Calibration using Attentive Neural Processes", Advances in Neural Information Processing Systems (NeurIPS), December 2021.
    BibTeX TR2021-149 PDF
    • @inproceedings{Zhan2021dec,
    • author = {Zhan, Sicheng and Wichern, Gordon and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {Meta-Learned Bayesian Optimization for Building Model Calibration using Attentive Neural Processes},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2021,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2021-149}
    • }
  •  Berntorp, K., Chakrabarty, A., Di Cairano, S., "Vehicle Rollover Avoidance by Parameter-Adaptive Reference Governor", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/​CDC45484.2021.9683770, December 2021, pp. 635-640.
    BibTeX TR2021-151 PDF
    • @inproceedings{Berntorp2021dec,
    • author = {Berntorp, Karl and Chakrabarty, Ankush and Di Cairano, Stefano},
    • title = {Vehicle Rollover Avoidance by Parameter-Adaptive Reference Governor},
    • booktitle = {IEEE Conference on Decision and Control (CDC)},
    • year = 2021,
    • pages = {635--640},
    • month = dec,
    • doi = {10.1109/CDC45484.2021.9683770},
    • url = {https://www.merl.com/publications/TR2021-151}
    • }
  •  Wang, Z.-Q., Wichern, G., Le Roux, J., "Convolutive Prediction for Monaural Speech Dereverberation and Noisy-Reverberant Speaker Separation", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2021.3129363, Vol. 29, pp. 3476-3490, December 2021.
    BibTeX TR2021-144 PDF
    • @article{Wang2021dec,
    • author = {Wang, Zhong-Qiu and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Convolutive Prediction for Monaural Speech Dereverberation and Noisy-Reverberant Speaker Separation},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2021,
    • volume = 29,
    • pages = {3476--3490},
    • month = dec,
    • doi = {10.1109/TASLP.2021.3129363},
    • url = {https://www.merl.com/publications/TR2021-144}
    • }
  •  Yu, X., van Baar, J., Chen, S., Sullivan, A., "Keypoint-aligned 3D Human Shape Recovery from A Single Image with Bilayer-Graph", International Conference on 3D Vision (3DV), DOI: 10.1109/​3DV53792.2021.00060, December 2021, pp. 505-514.
    BibTeX TR2021-143 PDF
    • @inproceedings{Yu2021dec,
    • author = {Yu, Xin and van Baar, Jeroen and Chen, Siheng and Sullivan, Alan},
    • title = {Keypoint-aligned 3D Human Shape Recovery from A Single Image with Bilayer-Graph},
    • booktitle = {International Conference on 3D Vision (3DV)},
    • year = 2021,
    • pages = {505--514},
    • month = dec,
    • doi = {10.1109/3DV53792.2021.00060},
    • url = {https://www.merl.com/publications/TR2021-143}
    • }