Publications

642 / 3,778 publications found.


  •  Delcroix, M., Watanabe, S., "Recent Advances in Distant Speech Recognition," Tech. Rep. TR2016-115, Interspeech Tutorials, September 2016.
    BibTeX TR2016-115 PDF
    • @techreport{Delcroix2016sep,
    • author = {Delcroix, Marc and Watanabe, Shinji},
    • title = {Recent Advances in Distant Speech Recognition},
    • booktitle = {Interspeech Tutorials},
    • institution = {Interspeech},
    • year = 2016,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-115}
    • }
  •  Le Roux, J., Vincent, E., Erdogan, H., "Learning-Based Approaches to Speech Enhancement and Separation," Tech. Rep. TR2016-113, Interspeech Tutorials, September 2016.
    BibTeX TR2016-113 PDF
    • @techreport{LeRoux2016sep,
    • author = {Le Roux, Jonathan and Vincent, Emmanuel and Erdogan, Hakan},
    • title = {Learning-Based Approaches to Speech Enhancement and Separation},
    • booktitle = {Interspeech Tutorials},
    • institution = {Interspeech},
    • year = 2016,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-113}
    • }
  •  Erdogan, H., Hershey, J.R., Watanabe, S., Mandel, M., Le Roux, J., "Improved MVDR beamforming using single-channel mask prediction networks", Interspeech, DOI: 10.21437/Interspeech.2016-552, September 2016, pp. 1981-1985.
    BibTeX TR2016-072 PDF
    • @inproceedings{Erdogan2016sep,
    • author = {Erdogan, Hakan and Hershey, John R. and Watanabe, Shinji and Mandel, Michael and Le Roux, Jonathan},
    • title = {Improved MVDR beamforming using single-channel mask prediction networks},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {1981--1985},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-552},
    • url = {https://www.merl.com/publications/TR2016-072}
    • }
  •  Hori, C., Hori, T., Watanabe, S., Hershey, J.R., "Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs", Interspeech, DOI: 10.21437/Interspeech.2016-1171, September 2016, pp. 3236-3240.
    BibTeX TR2016-074 PDF
    • @inproceedings{Hori2016sep,
    • author = {Hori, Chiori and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
    • title = {Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {3236--3240},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-1171},
    • url = {https://www.merl.com/publications/TR2016-074}
    • }
  •  Isik, Y., Le Roux, J., Chen, Z., Watanabe, S., Hershey, J.R., "Single-Channel Multi-Speaker Separation using Deep Clustering", Interspeech, DOI: 10.21437/Interspeech.2016-1176, September 2016, pp. 545-549.
    BibTeX TR2016-073 PDF
    • @inproceedings{Isik2016sep,
    • author = {Isik, Yusuf and Le Roux, Jonathan and Chen, Zhuo and Watanabe, Shinji and Hershey, John R.},
    • title = {Single-Channel Multi-Speaker Separation using Deep Clustering},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {545--549},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-1176},
    • url = {https://www.merl.com/publications/TR2016-073}
    • }
  •  Zmolikova, K., Karafiat, M., Vesely, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J.H., "Data selection by sequence summarizing neural network in mismatch condition training", Interspeech, DOI: 10.21437/Interspeech.2016-741, September 2016, pp. 2354-2358.
    BibTeX TR2016-075 PDF
    • @inproceedings{Zmolikova2016sep,
    • author = {Zmolikova, Katerina and Karafiat, Martin and Vesely, Karel and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan Honza},
    • title = {Data selection by sequence summarizing neural network in mismatch condition training},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {2354--2358},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-741},
    • url = {https://www.merl.com/publications/TR2016-075}
    • }
  •  Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), September 2016, pp. 35-39.
    BibTeX TR2016-114 PDF
    • @inproceedings{Hayashi2016sep,
    • author = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and Le Roux, Jonathan and Takeda, Kazuya},
    • title = {Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection},
    • booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
    • year = 2016,
    • pages = {35--39},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-114}
    • }
  •  Koike-Akino, T., Mahajan, R., Marks, T.K., Tuzel, C.O., Wang, Y., Watanabe, S., Orlik, P.V., "High-Accuracy User Identification Using EEG Biometrics", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/EMBC.2016.7590835, August 2016, pp. 854-858.
    BibTeX TR2016-105 PDF Presentation
    • @inproceedings{Koike-Akino2016aug,
    • author = {Koike-Akino, Toshiaki and Mahajan, Ruhi and Marks, Tim K. and Tuzel, C. Oncel and Wang, Ye and Watanabe, Shinji and Orlik, Philip V.},
    • title = {High-Accuracy User Identification Using EEG Biometrics},
    • booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
    • year = 2016,
    • pages = {854--858},
    • month = aug,
    • doi = {10.1109/EMBC.2016.7590835},
    • url = {https://www.merl.com/publications/TR2016-105}
    • }
  •  Nikovski, D.N., Byadarhaly, K., "Regularized Covariance Matrix Estimation with High Dimensional Data for Supervised Anomaly Detection Problems", IEEE International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/IJCNN.2016.7727554, July 2016, pp. 2811-2818.
    BibTeX TR2016-099 PDF
    • @inproceedings{Nikovski2016jul,
    • author = {Nikovski, Daniel N. and Byadarhaly, Kiran},
    • title = {Regularized Covariance Matrix Estimation with High Dimensional Data for Supervised Anomaly Detection Problems},
    • booktitle = {IEEE International Joint Conference on Neural Networks (IJCNN)},
    • year = 2016,
    • pages = {2811--2818},
    • month = jul,
    • doi = {10.1109/IJCNN.2016.7727554},
    • url = {https://www.merl.com/publications/TR2016-099}
    • }
  •  Hori, C., Watanabe, S., Hori, T., Harsham, B.A., Hershey, J.R., Koji, Y., Fujii, Y., Furumoto, Y., "Driver Confusion Status Detection Using Recurrent Neural Networks", IEEE International Conference on Multimedia and Expo (ICME), DOI: 10.1109/ICME.2016.7552966, July 2016.
    BibTeX TR2016-088 PDF
    • @inproceedings{Hori2016jul,
    • author = {Hori, Chiori and Watanabe, Shinji and Hori, Takaaki and Harsham, Bret A. and Hershey, John R. and Koji, Yusuke and Fujii, Youichi and Furumoto, Yuki},
    • title = {Driver Confusion Status Detection Using Recurrent Neural Networks},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2016,
    • month = jul,
    • doi = {10.1109/ICME.2016.7552966},
    • url = {https://www.merl.com/publications/TR2016-088}
    • }
  •  Singh, B., Marks, T.K., Jones, M.J., Tuzel, C.O., Shao, M., "A Multi-Stream Bi-Directional Recurrent Neural Network for Fine-Grained Action Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2016.216, June 2016, pp. 1961-1970.
    BibTeX TR2016-080 PDF Data
    • @inproceedings{Singh2016jun,
    • author = {Singh, Bharat and Marks, Tim K. and Jones, Michael J. and Tuzel, C. Oncel and Shao, Ming},
    • title = {A Multi-Stream Bi-Directional Recurrent Neural Network for Fine-Grained Action Detection},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2016,
    • pages = {1961--1970},
    • month = jun,
    • doi = {10.1109/CVPR.2016.216},
    • url = {https://www.merl.com/publications/TR2016-080}
    • }
  •  Vemulapalli, R., Tuzel, C.O., Liu, M.-Y., "Deep Gaussian Conditional Random Field Network: A Model-based Deep Network for Discriminative Denoising", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2016.351, June 2016, pp. 4801-4809.
    BibTeX TR2016-079 PDF
    • @inproceedings{Vemulapalli2016jun2,
    • author = {Vemulapalli, Raviteja and Tuzel, C. Oncel and Liu, Ming-Yu},
    • title = {Deep Gaussian Conditional Random Field Network: A Model-based Deep Network for Discriminative Denoising},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2016,
    • pages = {4801--4809},
    • month = jun,
    • doi = {10.1109/CVPR.2016.351},
    • url = {https://www.merl.com/publications/TR2016-079}
    • }
  •  Vemulapalli, R., Tuzel, C.O., Liu, M.-Y., Chellappa, R., "Gaussian Conditional Random Field Network for Semantic Segmentation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2016, pp. 3224-3233.
    BibTeX TR2016-078 PDF
    • @inproceedings{Vemulapalli2016jun,
    • author = {Vemulapalli, Raviteja and Tuzel, C. Oncel and Liu, Ming-Yu and Chellappa, Rama},
    • title = {Gaussian Conditional Random Field Network for Semantic Segmentation},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2016,
    • pages = {3224--3233},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2016-078}
    • }
  •  Son, K., Liu, M.-Y., Taguchi, Y., "Learning to Remove Multipath Distortions in Time-of-Flight Range Images for a Robotic Arm Setup", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA.2016.7487515, May 2016, pp. 3390-3397.
    BibTeX TR2016-036 PDF
    • @inproceedings{Son2016may,
    • author = {Son, Kilho and Liu, Ming-Yu and Taguchi, Yuichi},
    • title = {Learning to Remove Multipath Distortions in Time-of-Flight Range Images for a Robotic Arm Setup},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2016,
    • pages = {3390--3397},
    • month = may,
    • doi = {10.1109/ICRA.2016.7487515},
    • url = {https://www.merl.com/publications/TR2016-036}
    • }
  •  Jones, M.J., Nikovski, D.N., Imamura, M., Hirata, T., "Exemplar Learning for Extremely Efficient Anomaly Detection in Real-Valued Time Series", Journal of Data Mining and Knowledge Discovery, DOI: 10.1007/s10618-015-0449-3, Vol. 30, No. 6, pp. 1427-1454, March 2016.
    BibTeX TR2016-027 PDF
    • @article{Jones2016mar,
    • author = {Jones, Michael J. and Nikovski, Daniel N. and Imamura, Makoto and Hirata, Takahisa},
    • title = {Exemplar Learning for Extremely Efficient Anomaly Detection in Real-Valued Time Series},
    • journal = {Journal of Data Mining and Knowledge Discovery},
    • year = 2016,
    • volume = 30,
    • number = 6,
    • pages = {1427--1454},
    • month = mar,
    • doi = {10.1007/s10618-015-0449-3},
    • issn = {1573-756X},
    • url = {https://www.merl.com/publications/TR2016-027}
    • }
  •  Hershey, J.R., Chen, Z., Le Roux, J., Watanabe, S., "Deep Clustering: Discriminative Embeddings for Segmentation and Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7471631, March 2016, pp. 31-35.
    BibTeX TR2016-003 PDF
    • @inproceedings{Hershey2016mar,
    • author = {Hershey, John R. and Chen, Zhuo and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {Deep Clustering: Discriminative Embeddings for Segmentation and Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {31--35},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7471631},
    • url = {https://www.merl.com/publications/TR2016-003}
    • }
  •  Hori, T., Hori, C., Watanabe, S., Hershey, J.R., "Minimum Word Error Training of Long Short-Term Memory Recurrent Neural Network Language Models for Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472827, March 2016, pp. 5990-5994.
    BibTeX TR2016-011 PDF
    • @inproceedings{Hori2016mar,
    • author = {Hori, Takaaki and Hori, Chiori and Watanabe, Shinji and Hershey, John R.},
    • title = {Minimum Word Error Training of Long Short-Term Memory Recurrent Neural Network Language Models for Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {5990--5994},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7472827},
    • url = {https://www.merl.com/publications/TR2016-011}
    • }
  •  Vesely, K., Watanabe, S., Zmolikova, K., Karafiat, M., Burget, L., Cernocky, J.H., "Sequence Summarizing Neural Network for Speaker Adaptation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472692, March 2016, pp. 5315-5319.
    BibTeX TR2016-001 PDF
    • @inproceedings{Vesely2016mar,
    • author = {Vesely, Karel and Watanabe, Shinji and Zmolikova, Katerina and Karafiat, Martin and Burget, Lukas and Cernocky, Jan Honza},
    • title = {Sequence Summarizing Neural Network for Speaker Adaptation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {5315--5319},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7472692},
    • url = {https://www.merl.com/publications/TR2016-001}
    • }
  •  Wisdom, S., Hershey, J.R., Le Roux, J., Watanabe, S., "Deep Unfolding for Multichannel Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7471649, March 2016, pp. 121-125.
    BibTeX TR2016-008 PDF
    • @inproceedings{Wisdom2016mar,
    • author = {Wisdom, Scott and Hershey, John R. and Le Roux, Jonathan and Watanabe, Shinji},
    • title = {Deep Unfolding for Multichannel Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {121--125},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7471649},
    • url = {https://www.merl.com/publications/TR2016-008}
    • }
  •  Xiao, X., Watanabe, S., Erdogan, H., Lu, L., Hershey, J., Seltzer, M., Chen, G., Zhang, Y., Mandel, M., Yu, D., "Deep Beamforming Networks for Multi-Channel Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472778, March 2016, pp. 5745-5749.
    BibTeX TR2016-002 PDF
    • @inproceedings{Xiao2016mar,
    • author = {Xiao, Xiong and Watanabe, Shinji and Erdogan, Hakan and Lu, Liang and Hershey, John and Seltzer, Mike and Chen, Guoguo and Zhang, Yu and Mandel, Michael and Yu, Dong},
    • title = {Deep Beamforming Networks for Multi-Channel Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2016,
    • pages = {5745--5749},
    • month = mar,
    • doi = {10.1109/ICASSP.2016.7472778},
    • url = {https://www.merl.com/publications/TR2016-002}
    • }
  •  Liu, M.-Y., Mallya, A., Tuzel, C.O., Chen, X., "Unsupervised Network Pretraining via Encoding Human Design", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV.2016.7477698, March 2016, pp. 1-9.
    BibTeX TR2016-022 PDF
    • @inproceedings{Liu2016mar,
    • author = {Liu, Ming-Yu and Mallya, Arun and Tuzel, C. Oncel and Chen, Xi},
    • title = {Unsupervised Network Pretraining via Encoding Human Design},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2016,
    • pages = {1--9},
    • month = mar,
    • doi = {10.1109/WACV.2016.7477698},
    • url = {https://www.merl.com/publications/TR2016-022}
    • }
  •  Farahmand, A.-M., Nikovski, D.N., Igarashi, Y., Konaka, H., "Truncated Approximate Dynamic Programming with Task-Dependent Terminal Value", Association for the Advancement of Artificial Intelligence (AAAI), February 2016, pp. 3123-3129.
    BibTeX TR2016-020 PDF
    • @inproceedings{Farahmand2016feb,
    • author = {Farahmand, Amir-massoud and Nikovski, Daniel N. and Igarashi, Yuji and Konaka, Hiroki},
    • title = {Truncated Approximate Dynamic Programming with Task-Dependent Terminal Value},
    • booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
    • year = 2016,
    • pages = {3123--3129},
    • month = feb,
    • url = {https://www.merl.com/publications/TR2016-020}
    • }
  •  Kanagawa, H., Tachioka, Y., Watanabe, S., Ishii, J., "Feature-Space Structural MAPLR with Regression Tree-Based Multiple Transformation Matrices for DNN", Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC), DOI: 10.1109/APSIPA.2015.7415425, December 2015, pp. 86-92.
    BibTeX TR2015-150 PDF
    • @inproceedings{Kanagawa2015dec,
    • author = {Kanagawa, H. and Tachioka, Y. and Watanabe, S. and Ishii, J.},
    • title = {Feature-Space Structural MAPLR with Regression Tree-Based Multiple Transformation Matrices for DNN},
    • booktitle = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
    • year = 2015,
    • pages = {86--92},
    • month = dec,
    • doi = {10.1109/APSIPA.2015.7415425},
    • url = {https://www.merl.com/publications/TR2015-150}
    • }
  •  Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The Third 'CHiME' Speech Separation and Recognition Challenge: Dataset, Task and Baselines", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2015.7404837, December 2015, pp. 504-511.
    BibTeX TR2015-136 PDF
    • @inproceedings{Barker2015dec,
    • author = {Barker, J. and Marxer, R. and Vincent, E. and Watanabe, S.},
    • title = {The Third 'CHiME' Speech Separation and Recognition Challenge: Dataset, Task and Baselines},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2015,
    • pages = {504--511},
    • month = dec,
    • publisher = {IEEE},
    • doi = {10.1109/ASRU.2015.7404837},
    • url = {https://www.merl.com/publications/TR2015-136}
    • }
  •  Hsiao, R., Ma, J., Hartmann, W., Karafiat, M., Grezl, F., Burget, L., Szoke, I., Cernocky, J., Watanabe, S., Chen, Z., Mallidi, S.H., Hermansky, H., Tsakalidis, S., Schwartz, R., "Robust Speech Recognition in Unknown Reverberant and Noisy Conditions", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2015.7404841, December 2015, pp. 533-538.
    BibTeX TR2015-138 PDF
    • @inproceedings{Hsiao2015dec,
    • author = {Hsiao, R. and Ma, J. and Hartmann, W. and Karafiat, M. and Grezl, F. and Burget, L. and Szoke, I. and Cernocky, J. and Watanabe, S. and Chen, Z. and Mallidi, S. H. and Hermansky, H. and Tsakalidis, S. and Schwartz, R.},
    • title = {Robust Speech Recognition in Unknown Reverberant and Noisy Conditions},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2015,
    • pages = {533--538},
    • month = dec,
    • publisher = {IEEE},
    • doi = {10.1109/ASRU.2015.7404841},
    • url = {https://www.merl.com/publications/TR2015-138}
    • }