Publications

464 / 3,101 publications found.


  •  Moritz, N., Hori, T., Le Roux, J., "Capturing Multi-Resolution Context by Dilated Self-Attention", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), June 2021.
    BibTeX TR2021-036 PDF
    • @inproceedings{Moritz2021jun,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Capturing Multi-Resolution Context by Dilated Self-Attention},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2021,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2021-036}
    • }
  •  Khurana, S., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), June 2021.
    BibTeX TR2021-039 PDF
    • @inproceedings{Khurana2021jun,
    • author = {Khurana, Sameer and Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2021,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2021-039}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Semi-Supervised Speech Recognition via Graph-Based Temporal Classification", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), June 2021.
    BibTeX TR2021-037 PDF
    • @inproceedings{Moritz2021jun2,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Semi-Supervised Speech Recognition via Graph-Based Temporal Classification},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2021,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2021-037}
    • }
  •  Pan, C., Chen, S., Ortega, A., "Spatio-Temporal Graph Scattering Transform", International Conference on Learning Representations (ICLR), May 2021.
    BibTeX TR2021-044 PDF
    • @inproceedings{Pan2021may,
    • author = {Pan, Chao and Chen, Siheng and Ortega, Antonio},
    • title = {Spatio-Temporal Graph Scattering Transform},
    • booktitle = {International Conference on Learning Representations (ICLR)},
    • year = 2021,
    • month = may,
    • url = {https://www.merl.com/publications/TR2021-044}
    • }
  •  Han, M., Ozdenizci, O., Koike-Akino, T., Wang, Y., Erdogmus, D., "Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders", IEEE Journal of Biomedical and Health Informatics, DOI: 10.1109/​JBHI.2021.3062335, April 2021.
    BibTeX TR2021-027 PDF
    • @article{Han2021apr,
    • author = {Han, Mo and Ozdenizci, Ozan and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
    • title = {Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders},
    • journal = {IEEE Journal of Biomedical and Health Informatics},
    • year = 2021,
    • month = apr,
    • doi = {10.1109/JBHI.2021.3062335},
    • url = {https://www.merl.com/publications/TR2021-027}
    • }
  •  Ramachandra, B., Jones, M.J., Vatsavai, R., "Perceptual Metric Learning for Video Anomaly Detection", Machine Vision and Applications, DOI: 10.1007/​s00138-021-01187-5, Vol. 32, No. 63, March 2021.
    BibTeX TR2021-028 PDF
    • @article{Ramachandra2021mar,
    • author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
    • title = {Perceptual Metric Learning for Video Anomaly Detection},
    • journal = {Machine Vision and Applications},
    • year = 2021,
    • volume = 32,
    • number = 63,
    • month = mar,
    • doi = {10.1007/s00138-021-01187-5},
    • url = {https://www.merl.com/publications/TR2021-028}
    • }
  •  Demir, A., Koike-Akino, T., Wang, Y., Erdogmus, D., "AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference", IEEE Access, DOI: 10.1109/​ACCESS.2021.3064530, Vol. 9, pp. 39955-39972, March 2021.
    BibTeX TR2021-016 PDF
    • @article{Demir2021mar,
    • author = {Demir, Andac and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
    • title = {AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference},
    • journal = {IEEE Access},
    • year = 2021,
    • volume = 9,
    • pages = {39955--39972},
    • month = mar,
    • doi = {10.1109/ACCESS.2021.3064530},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2021-016}
    • }
  •  Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D., TaherSima, M., Parsons, K., "Application of Deep Learning for Nanophotonic Device Design", SPIE Photonics West, Bahram Jalali and Ken-ichi Kitayama, Eds., DOI: 10.1117/​12.2579104, March 2021.
    BibTeX TR2020-182 PDF Video
    • @inproceedings{Kojima2021mar,
    • author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh and TaherSima, Mohammad and Parsons, Kieran},
    • title = {Application of Deep Learning for Nanophotonic Device Design},
    • booktitle = {SPIE Photonics West},
    • year = 2021,
    • editor = {Bahram Jalali and Ken-ichi Kitayama},
    • month = mar,
    • publisher = {SPIE},
    • doi = {10.1117/12.2579104},
    • url = {https://www.merl.com/publications/TR2020-182}
    • }
  •  Geng, S., Gao, P., Chatterjee, M., Hori, C., Le Roux, J., Zhang, Y., Li, H., Cherian, A., "Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers", AAAI Conference on Artificial Intelligence, February 2021.
    BibTeX TR2021-010 PDF
    • @inproceedings{Geng2021feb,
    • author = {Geng, Shijie and Gao, Peng and Chatterjee, Moitreya and Hori, Chiori and Le Roux, Jonathan and Zhang, Yongfeng and Li, Hongsheng and Cherian, Anoop},
    • title = {Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2021,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2021-010}
    • }
  •  Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D., Tang, Y., Wang, Y., Parsons, K., "Deep Neural Networks for Inverse Design of Nanophotonic Devices", IEEE Journal of Lightwave Technology, DOI: 10.1109/​JLT.2021.3050083, January 2021.
    BibTeX TR2021-001 PDF
    • @article{Kojima2021jan,
    • author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh and Tang, Yingheng and Wang, Ye and Parsons, Kieran},
    • title = {Deep Neural Networks for Inverse Design of Nanophotonic Devices},
    • journal = {IEEE Journal of Lightwave Technology},
    • year = 2021,
    • month = jan,
    • doi = {10.1109/JLT.2021.3050083},
    • issn = {1558-2213},
    • url = {https://www.merl.com/publications/TR2021-001}
    • }
  •  Lohit, S., Anirudh, R., Turaga, P., "Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
    BibTeX TR2021-004 PDF
    • @inproceedings{Lohit2021jan,
    • author = {Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
    • title = {Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2021,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2021-004}
    • }
  •  Anirudh, R., Lohit, S., Turaga, P., "Generative Patch Priors for Practical Compressive Image Recovery", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
    BibTeX TR2021-003 PDF
    • @inproceedings{Anirudh2021jan,
    • author = {Anirudh, Rushil and Lohit, Suhas and Turaga, Pavan},
    • title = {Generative Patch Priors for Practical Compressive Image Recovery},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2021,
    • month = jan,
    • url = {https://www.merl.com/publications/TR2021-003}
    • }
  •  Nowara, E., Marks, T., Mansour, H., Veeraraghavan, A., "Near-Infrared Imaging Photoplethysmography During Driving", IEEE Transactions on Intelligent Transportation Systems, DOI: 10.1109/​TITS.2020.3038317, pp. 1-12, December 2020.
    BibTeX TR2020-161 PDF
    • @article{Nowara2020dec,
    • author = {Nowara, Ewa and Marks, Tim and Mansour, Hassan and Veeraraghavan, Ashok},
    • title = {Near-Infrared Imaging Photoplethysmography During Driving},
    • journal = {IEEE Transactions on Intelligent Transportation Systems},
    • year = 2020,
    • pages = {1--12},
    • month = dec,
    • doi = {10.1109/TITS.2020.3038317},
    • url = {https://www.merl.com/publications/TR2020-161}
    • }
  •  Li, M., Chen, S., Zhang, Y., "Graph Cross Networks with Vertex Infomax Pooling", Advances in Neural Information Processing Systems (NeurIPS), December 2020.
    BibTeX TR2020-167 PDF
    • @inproceedings{Li2020dec,
    • author = {Li, Maosen and Chen, Siheng and Zhang, Ya},
    • title = {Graph Cross Networks with Vertex Infomax Pooling},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2020,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2020-167}
    • }
  •  Talreja, V., Koike-Akino, T., Wang, Y., Millar, D.S., Kojima, K., Parsons, K., "End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping", European Conference on Optical Communication (ECOC), November 2020.
    BibTeX TR2020-155 PDF Video
    • @inproceedings{Talreja2020nov,
    • author = {Talreja, Veeru and Koike-Akino, Toshiaki and Wang, Ye and Millar, David S. and Kojima, Keisuke and Parsons, Kieran},
    • title = {End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping},
    • booktitle = {European Conference on Optical Communication (ECOC)},
    • year = 2020,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2020-155}
    • }
  •  Corcodel, R., Jain, S., van Baar, J., "Interactive Tactile Perception for Classification of Novel Object Instances", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/​IROS45743.2020.9341795, November 2020, pp. 9861-9868.
    BibTeX TR2020-143 PDF
    • @inproceedings{Corcodel2020nov,
    • author = {Corcodel, Radu and Jain, Siddarth and van Baar, Jeroen},
    • title = {Interactive Tactile Perception for Classification of Novel Object Instances},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2020,
    • pages = {9861--9868},
    • month = nov,
    • publisher = {IEEE},
    • doi = {10.1109/IROS45743.2020.9341795},
    • url = {https://www.merl.com/publications/TR2020-143}
    • }
  •  Jones, M.J., Ramachandra, B., Vatsavai, R., "A Survey of Single-Scene Video Anomaly Detection", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/​TPAMI.2020.3040591, November 2020.
    BibTeX TR2021-029 PDF
    • @article{Jones2020nov,
    • author = {Jones, Michael J. and Ramachandra, Bharathkumar and Vatsavai, Ranga},
    • title = {A Survey of Single-Scene Video Anomaly Detection},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2020,
    • month = nov,
    • doi = {10.1109/TPAMI.2020.3040591},
    • url = {https://www.merl.com/publications/TR2021-029}
    • }
  •  Ota, K., Sasaki, Y., Jha, D., Yoshiyasu, Y., Kanezaki, A., "Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), November 2020.
    BibTeX TR2020-141 PDF Software
    • @inproceedings{Ota2020nov,
    • author = {Ota, Kei and Sasaki, Yoko and Jha, Devesh and Yoshiyasu, Yusuke and Kanezaki, Asako},
    • title = {Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2020,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2020-141}
    • }
  •  Hori, T., Moritz, N., Hori, C., Le Roux, J., "Transformer-based Long-context End-to-end Speech Recognition", Annual Conference of the International Speech Communication Association (Interspeech), DOI: 10.21437/​Interspeech.2020-2928, October 2020, pp. 5011-5015.
    BibTeX TR2020-139 PDF
    • @inproceedings{Hori2020oct,
    • author = {Hori, Takaaki and Moritz, Niko and Hori, Chiori and Le Roux, Jonathan},
    • title = {Transformer-based Long-context End-to-end Speech Recognition},
    • booktitle = {Annual Conference of the International Speech Communication Association (Interspeech)},
    • year = 2020,
    • pages = {5011--5015},
    • month = oct,
    • doi = {10.21437/Interspeech.2020-2928},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2020-139}
    • }
  •  Jayashankar, T., Le Roux, J., Moulin, P., "Detecting Audio Attacks on ASR Systems with Dropout Uncertainty", Annual Conference of the International Speech Communication Association (Interspeech), DOI: 10.21437/​Interspeech.2020-1846, October 2020, pp. 4671-4675.
    BibTeX TR2020-137 PDF
    • @inproceedings{Jayashankar2020oct,
    • author = {Jayashankar, Tejas and Le Roux, Jonathan and Moulin, Pierre},
    • title = {Detecting Audio Attacks on ASR Systems with Dropout Uncertainty},
    • booktitle = {Annual Conference of the International Speech Communication Association (Interspeech)},
    • year = 2020,
    • pages = {4671--4675},
    • month = oct,
    • doi = {10.21437/Interspeech.2020-1846},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2020-137}
    • }
  •  Moritz, N., Wichern, G., Hori, T., Le Roux, J., "All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection", Annual Conference of the International Speech Communication Association (Interspeech), DOI: 10.21437/​Interspeech.2020-2757, October 2020, pp. 3112-3116.
    BibTeX TR2020-138 PDF
    • @inproceedings{Moritz2020oct,
    • author = {Moritz, Niko and Wichern, Gordon and Hori, Takaaki and Le Roux, Jonathan},
    • title = {All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection},
    • booktitle = {Annual Conference of the International Speech Communication Association (Interspeech)},
    • year = 2020,
    • pages = {3112--3116},
    • month = oct,
    • doi = {10.21437/Interspeech.2020-2757},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2020-138}
    • }
  •  Manilow, E., Wichern, G., Le Roux, J., "Hierarchical Musical Instrument Separation", International Society for Music Information Retrieval (ISMIR) Conference, October 2020, pp. 376-383.
    BibTeX TR2020-136 PDF
    • @inproceedings{Manilow2020oct,
    • author = {Manilow, Ethan and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Hierarchical Musical Instrument Separation},
    • booktitle = {International Society for Music Information Retrieval (ISMIR) Conference},
    • year = 2020,
    • pages = {376--383},
    • month = oct,
    • isbn = {978-0-9813537-0-8},
    • url = {https://www.merl.com/publications/TR2020-136}
    • }
  •  Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D., Parsons, K., Qi, M., "Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices", Laser & Photonics Reviews, DOI: 10.1002/​lpor.202000287, Vol. 14, pp. 2000287, October 2020.
    BibTeX TR2020-135 PDF
    • @article{Tang2020oct,
    • author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh and Parsons, Kieran and Qi, Minghao},
    • title = {Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices},
    • journal = {Laser \& Photonics Reviews},
    • year = 2020,
    • volume = 14,
    • pages = 2000287,
    • month = oct,
    • doi = {10.1002/lpor.202000287},
    • url = {https://www.merl.com/publications/TR2020-135}
    • }
  •  Seetharaman, P., Wichern, G., Pardo, B., Le Roux, J., "Autoclip: Adaptive Gradient Clipping For Source Separation Networks", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/​MLSP49062.2020.9231926, September 2020.
    BibTeX TR2020-132 PDF
    • @inproceedings{Seetharaman2020sep,
    • author = {Seetharaman, Prem and Wichern, Gordon and Pardo, Bryan and Le Roux, Jonathan},
    • title = {Autoclip: Adaptive Gradient Clipping For Source Separation Networks},
    • booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
    • year = 2020,
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/MLSP49062.2020.9231926},
    • url = {https://www.merl.com/publications/TR2020-132}
    • }
  •  Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D., Parsons, K., TaherSima, M., Sang, F., Klamkin, J., Qi, M., "Inverse Design of Nanophotonic Devices using Deep Neural Networks", Asia Communications and Photonics Conference (ACP), September 2020, pp. Su1A.1.
    BibTeX TR2020-130 PDF Video
    • @inproceedings{Kojima2020sep,
    • author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh and Parsons, Kieran and TaherSima, Mohammad and Sang, Fengqiao and Klamkin, Jonathan and Qi, Minghao},
    • title = {Inverse Design of Nanophotonic Devices using Deep Neural Networks},
    • booktitle = {Asia Communications and Photonics Conference (ACP)},
    • year = 2020,
    • pages = {Su1A.1},
    • month = sep,
    • publisher = {Optical Society of America},
    • isbn = {978-1-943580-82-8},
    • url = {https://www.merl.com/publications/TR2020-130}
    • }