Publications

557 / 3,666 publications found.


  •  van Baar, J., Sullivan, A., Corcodel, R., Jha, D.K., Romeres, D., Nikovski, D.N., "Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/​ICRA.2019.8793561, May 2019, pp. 6001-6007.
    BibTeX TR2018-202 PDF Video Software
    • @inproceedings{vanBaar2019may,
    • author = {van Baar, Jeroen and Sullivan, Alan and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and Nikovski, Daniel N.},
    • title = {Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2019,
    • pages = {6001--6007},
    • month = may,
    • doi = {10.1109/ICRA.2019.8793561},
    • url = {https://www.merl.com/publications/TR2018-202}
    • }
  •  Aihara, R., Hanazawa, T., Okato, Y., Wichern, G., Le Roux, J., "Teacher-Student Deep Clustering For Low-Delay Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8682695, May 2019.
    BibTeX TR2019-003 PDF
    • @inproceedings{Aihara2019may,
    • author = {Aihara, Ryo and Hanazawa, Toshiyuki and Okato, Yohei and Wichern, Gordon and Le Roux, Jonathan},
    • title = {Teacher-Student Deep Clustering For Low-Delay Channel Speech Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682695},
    • url = {https://www.merl.com/publications/TR2019-003}
    • }
  •  Baskar, M.K., Burget, L., Watanabe, S., Karafiat, M., Hori, T., Cernocky, J.H., "Promising Accurate Prefix Boosting for Sequence-to-Sequence ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8682782, May 2019, pp. 5646-5650.
    BibTeX TR2019-006 PDF
    • @inproceedings{Baskar2019may,
    • author = {Baskar, Murali Karthick and Burget, Lukas and Watanabe, Shinji and Karafiat, Martin and Hori, Takaaki and Cernocky, Jan Honza},
    • title = {Promising Accurate Prefix Boosting for Sequence-to-Sequence ASR},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • pages = {5646--5650},
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682782},
    • issn = {2379-190X},
    • isbn = {978-1-4799-8131-1},
    • url = {https://www.merl.com/publications/TR2019-006}
    • }
  •  Cho, J., Watanabe, S., Hori, T., Baskar, M.K., Inaguma, H., Villalba, J., Dehak, N., "Language Model Integration Based on Memory Control for Sequence to Sequence Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8683380, May 2019.
    BibTeX TR2019-007 PDF
    • @inproceedings{Cho2019may,
    • author = {Cho, Jaejin and Watanabe, Shinji and Hori, Takaaki and Baskar, Murali Karthick and Inaguma, Hirofumi and Villalba, Jesus and Dehak, Najim},
    • title = {Language Model Integration Based on Memory Control for Sequence to Sequence Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683380},
    • url = {https://www.merl.com/publications/TR2019-007}
    • }
  •  Hori, C., Alamri, H., Wang, J., Wichern, G., Hori, T., Cherian, A., Marks, T.K., Cartillier, V., Lopes, R., Das, A., Essa, I., Batra, D., Parikh, D., "End-to-End Audio Visual Scene-Aware Dialog Using Multimodal Attention-Based Video Features", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8682583, May 2019.
    BibTeX TR2019-016 PDF
    • @inproceedings{Hori2019may2,
    • author = {Hori, Chiori and Alamri, Huda and Wang, Jue and Wichern, Gordon and Hori, Takaaki and Cherian, Anoop and Marks, Tim K. and Cartillier, Vincent and Lopes, Raphael and Das, Abhishek and Essa, Irfan and Batra, Dhruv and Parikh, Devi},
    • title = {End-to-End Audio Visual Scene-Aware Dialog Using Multimodal Attention-Based Video Features},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682583},
    • url = {https://www.merl.com/publications/TR2019-016}
    • }
  •  Hori, T., Astudillo, R., Hayashi, T., Zhang, Y., Watanabe, S., Le Roux, J., "Cycle-Consistency Training for End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8683307, May 2019.
    BibTeX TR2019-002 PDF
    • @inproceedings{Hori2019may,
    • author = {Hori, Takaaki and Astudillo, Ramon and Hayashi, Tomoki and Zhang, Yu and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {Cycle-Consistency Training for End-to-End Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683307},
    • url = {https://www.merl.com/publications/TR2019-002}
    • }
  •  Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "The Phasebook: Building Complex Masks via Discrete Representations for Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8682587, May 2019.
    BibTeX TR2019-008 PDF
    • @inproceedings{LeRoux2019may2,
    • author = {Le Roux, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
    • title = {The Phasebook: Building Complex Masks via Discrete Representations for Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682587},
    • url = {https://www.merl.com/publications/TR2019-008}
    • }
  •  Lohit, S., Liu, D., Mansour, H., Boufounos, P.T., "Unrolled Projected Gradient Descent for Multi-Spectral Image Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8683124, May 2019.
    BibTeX TR2019-010 PDF
    • @inproceedings{Lohit2019may,
    • author = {Lohit, Suhas and Liu, Dehong and Mansour, Hassan and Boufounos, Petros T.},
    • title = {Unrolled Projected Gradient Descent for Multi-Spectral Image Fusion},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683124},
    • url = {https://www.merl.com/publications/TR2019-010}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Triggered Attention for End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8683510, May 2019.
    BibTeX TR2019-015 PDF
    • @inproceedings{Moritz2019may,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Triggered Attention for End-to-End Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683510},
    • url = {https://www.merl.com/publications/TR2019-015}
    • }
  •  Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8683198, May 2019.
    BibTeX TR2019-014 PDF
    • @inproceedings{Seetharaman2019may2,
    • author = {Seetharaman, Prem and Wichern, Gordon and Le Roux, Jonathan and Pardo, Bryan},
    • title = {Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683198},
    • url = {https://www.merl.com/publications/TR2019-014}
    • }
  •  Seetharaman, P., Wichern, G., Venkataramani, S., Le Roux, J., "Class-Conditional Embeddings for Music Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8683007, May 2019.
    BibTeX TR2019-004 PDF
    • @inproceedings{Seetharaman2019may,
    • author = {Seetharaman, Prem and Wichern, Gordon and Venkataramani, Shrikant and Le Roux, Jonathan},
    • title = {Class-Conditional Embeddings for Music Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8683007},
    • url = {https://www.merl.com/publications/TR2019-004}
    • }
  •  Wang, X., Li, R., Mallidi, S.H., Hori, T., Watanabe, S., Hermansky, H., "Stream Attention-Based Multi-Array End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP.2019.8682650, May 2019.
    BibTeX TR2019-005 PDF
    • @inproceedings{Wang2019may,
    • author = {Wang, Xiaofei and Li, Ruizhi and Mallidi, Sri Harish and Hori, Takaaki and Watanabe, Shinji and Hermansky, Hynek},
    • title = {Stream Attention-Based Multi-Array End-to-End Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2019,
    • month = may,
    • doi = {10.1109/ICASSP.2019.8682650},
    • url = {https://www.merl.com/publications/TR2019-005}
    • }
  •  Lopez, O., Mansour, H., "Robust Subspace Learning for Motion Deblurring in Images", Tech. Rep. TR2018-208, Mitsubishi Electric Research Laboratories, March 2019.
    BibTeX TR2018-208 PDF
    • @techreport{Lopez2019mar,
    • author = {Lopez, Oscar and Mansour, Hassan},
    • title = {Robust Subspace Learning for Motion Deblurring in Images},
    • institution = {Mitsubishi Electric Research Laboratories},
    • number = {TR2018-208},
    • year = 2019,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2018-208}
    • }
  •  Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "Phasebook and Friends: Leveraging discrete representations for source separation", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/​JSTSP.2019.2904183, Vol. 13, No. 2, pp. 370-382, March 2019.
    BibTeX TR2018-199 PDF
    • @article{LeRoux2019mar,
    • author = {Le Roux, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
    • title = {Phasebook and Friends: Leveraging discrete representations for source separation},
    • journal = {IEEE Journal of Selected Topics in Signal Processing},
    • year = 2019,
    • volume = 13,
    • number = 2,
    • pages = {370--382},
    • month = mar,
    • doi = {10.1109/JSTSP.2019.2904183},
    • url = {https://www.merl.com/publications/TR2018-199}
    • }
  •  TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D.K., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Modeling for Integrated Photonics", Optical Fiber Communication Conference and Exposition and the National Fiber Optic Engineers Conference (OFC/NFOEC), DOI: 10.1364/​OFC.2019.W3B.5, March 2019.
    BibTeX TR2018-183 PDF
    • @inproceedings{TaherSima2019mar,
    • author = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh K. and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
    • title = {Deep Neural Network Inverse Modeling for Integrated Photonics},
    • booktitle = {Optical Fiber Communication Conference and Exposition and the National Fiber Optic Engineers Conference (OFC/NFOEC)},
    • year = 2019,
    • month = mar,
    • doi = {10.1364/OFC.2019.W3B.5},
    • url = {https://www.merl.com/publications/TR2018-183}
    • }
  •  Xu, H., Sun, H., Nikovski, D.N., Shoichi, K., Mori, K., "Learning Dynamical Demand Response Model in Real-Time Pricing Program", IEEE PES Innovative Smart Grid Technologies Conference - North America (ISGT NA), February 2019.
    BibTeX TR2018-198 PDF
    • @inproceedings{Xu2019feb,
    • author = {Xu, Hanchen and Sun, Hongbo and Nikovski, Daniel N. and Shoichi, Kitamura and Mori, Kazuyuki},
    • title = {Learning Dynamical Demand Response Model in Real-Time Pricing Program},
    • booktitle = {IEEE PES Innovative Smart Grid Technologies Conference - North America (ISGT NA)},
    • year = 2019,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2018-198}
    • }
  •  Cherian, A., Sullivan, A., "Sem-GAN: Semantically-Consistent Image-to-Image Translation", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/​WACV.2019.00196, January 2019.
    BibTeX TR2018-178 PDF
    • @inproceedings{Cherian2019jan,
    • author = {Cherian, Anoop and Sullivan, Alan},
    • title = {Sem-GAN: Semantically-Consistent Image-to-Image Translation},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2019,
    • month = jan,
    • doi = {10.1109/WACV.2019.00196},
    • url = {https://www.merl.com/publications/TR2018-178}
    • }
  •  Cho, J., Baskar, M.K., Li, R., Wiesner, M., Mallidi, S.H., Yalta, N., Karafiat, M., Watanabe, S., Hori, T., "Multilingual Sequence-to-Sequence Speech Recognition: Architecture, Transfer Learning, and Language Modeling", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/​SLT.2018.8639655, December 2018.
    BibTeX TR2018-175 PDF
    • @inproceedings{Cho2018dec,
    • author = {Cho, Jaejin and Baskar, Murali Karthick and Li, Ruizhi and Wiesner, Matthew and Mallidi, Sri Harish and Yalta, Nelson and Karafiat, Martin and Watanabe, Shinji and Hori, Takaaki},
    • title = {Multilingual Sequence-to-Sequence Speech Recognition: Architecture, Transfer Learning, and Language Modeling},
    • booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
    • year = 2018,
    • month = dec,
    • doi = {10.1109/SLT.2018.8639655},
    • url = {https://www.merl.com/publications/TR2018-175}
    • }
  •  Hayashi, T., Watanabe, S., Zhang, Y., Toda, T., Hori, T., Astudillo, R., Takeda, K., "Back-Translation-Style Data Augmentation for End-to-End ASR", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/​SLT.2018.8639619, December 2018.
    BibTeX TR2018-174 PDF
    • @inproceedings{Hayashi2018dec,
    • author = {Hayashi, Tomoki and Watanabe, Shinji and Zhang, Yu and Toda, Tomoki and Hori, Takaaki and Astudillo, Ramon and Takeda, Kazuya},
    • title = {Back-Translation-Style Data Augmentation for End-to-End ASR},
    • booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
    • year = 2018,
    • month = dec,
    • doi = {10.1109/SLT.2018.8639619},
    • url = {https://www.merl.com/publications/TR2018-174}
    • }
  •  Hori, T., Cho, J., Watanabe, S., "End-to-End Speech Recognition with Word-Based RNN Language Models", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/​SLT.2018.8639693, December 2018.
    BibTeX TR2018-176 PDF
    • @inproceedings{Hori2018dec,
    • author = {Hori, Takaaki and Cho, Jaejin and Watanabe, Shinji},
    • title = {End-to-End Speech Recognition with Word-Based RNN Language Models},
    • booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
    • year = 2018,
    • month = dec,
    • doi = {10.1109/SLT.2018.8639693},
    • url = {https://www.merl.com/publications/TR2018-176}
    • }
  •  Chakrabarty, A., Raghunathan, A.U., Di Cairano, S., Danielson, C., "Data-Driven Estimation of Reachable and Invariant Sets for Unmodeled Systems via Active Learning", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/​CDC.2018.8619646, December 2018.
    BibTeX TR2018-187 PDF
    • @inproceedings{Chakrabarty2018dec,
    • author = {Chakrabarty, Ankush and Raghunathan, Arvind U. and Di Cairano, Stefano and Danielson, Claus},
    • title = {Data-Driven Estimation of Reachable and Invariant Sets for Unmodeled Systems via Active Learning},
    • booktitle = {IEEE Conference on Decision and Control (CDC)},
    • year = 2018,
    • month = dec,
    • doi = {10.1109/CDC.2018.8619646},
    • url = {https://www.merl.com/publications/TR2018-187}
    • }
  •  Hori, T., Wang, W., Koji, Y., Hori, C., Harsham, B.A., Hershey, J., "Adversarial Training and Decoding Strategies for End-to-end Neural Conversation Models", Computer Speech and Language, DOI: 10.1016/​j.csl.2018.08.006, Vol. 54, pp. 122-139, December 2018.
    BibTeX TR2018-161 PDF
    • @article{Hori2018dec2,
    • author = {Hori, Takaaki and Wang, Wen and Koji, Yusuke and Hori, Chiori and Harsham, Bret A. and Hershey, John},
    • title = {Adversarial Training and Decoding Strategies for End-to-end Neural Conversation Models},
    • journal = {Computer Speech and Language},
    • year = 2018,
    • volume = 54,
    • pages = {122--139},
    • month = dec,
    • publisher = {Elsevier},
    • doi = {10.1016/j.csl.2018.08.006},
    • url = {https://www.merl.com/publications/TR2018-161}
    • }
  •  Natarajan, A., Laftchiev, E., "A Transfer Active Learning Framework to Predict Thermal Comfort", International Journal of Prognostics and Health Management Special Issue on PHM for Human Health & Performance, December 2018.
    BibTeX TR2018-156 PDF
    • @article{Natarajan2018dec,
    • author = {Natarajan, Annamalai and Laftchiev, Emil},
    • title = {A Transfer Active Learning Framework to Predict Thermal Comfort},
    • journal = {International Journal of Prognostics and Health Management Special Issue on PHM for Human Health \& Performance},
    • year = 2018,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2018-156}
    • }
  •  Romeres, D., Jha, D.K., Dalla Libera, A., Chiuso, A., Nikovski, D.N., "Derivative-Free Semiparametric Bayesian Models for Robot Learning", Advances in Neural Information Processing Systems (NIPS), December 2018.
    BibTeX TR2018-165 PDF
    • @inproceedings{Romeres2018dec,
    • author = {Romeres, Diego and Jha, Devesh K. and Dalla Libera, Alberto and Chiuso, Alessandro and Nikovski, Daniel N.},
    • title = {Derivative-Free Semiparametric Bayesian Models for Robot Learning},
    • booktitle = {Advances in Neural Information Processing Systems (NIPS)},
    • year = 2018,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2018-165}
    • }
  •  Kao, C.-C., Lee, T.-Y., Sen, P., Liu, M.-Y., "Localization-Aware Active Learning for Object Detection", Asian Conference on Computer Vision (ACCV), December 2018.
    BibTeX TR2018-166 PDF
    • @inproceedings{Kao2018dec,
    • author = {Kao, Chieh-Chi and Lee, Teng-Yok and Sen, Pradeep and Liu, Ming-Yu},
    • title = {Localization-Aware Active Learning for Object Detection},
    • booktitle = {Asian Conference on Computer Vision (ACCV)},
    • year = 2018,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2018-166}
    • }