- Tachioka, Y., Narita, T., Miura, I., Uramoto, T., Monta, N., Uenohara, S., Furuya, K., Watanabe, S., Le Roux, J., "Coupled initialization of multi-channel non-negative matrix factorization based on spatial and spectral information", Interspeech, August 2017.
BibTeX TR2017-134 PDF- @inproceedings{Tachioka2017aug,
- author = {Tachioka, Yuuki and Narita, Tomohiro and Miura, Iori and Uramoto, Takanobu and Monta, Natsuki and Uenohara, Shingo and Furuya, Kenichi and Watanabe, Shinji and Le Roux, Jonathan},
- title = {Coupled initialization of multi-channel non-negative matrix factorization based on spatial and spectral information},
- booktitle = {Interspeech},
- year = 2017,
- month = aug,
- url = {https://www.merl.com/publications/TR2017-134}
- }
- Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "Duration-Controlled LSTM for Polyphonic Sound Event Detection", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2017.2740002, Vol. 25, No. 11, August 2017.
BibTeX TR2017-150 PDF- @article{Hayashi2017aug,
- author = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and Le Roux, Jonathan and Takeda, Kazuya},
- title = {Duration-Controlled LSTM for Polyphonic Sound Event Detection},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2017,
- volume = 25,
- number = 11,
- month = aug,
- doi = {10.1109/TASLP.2017.2740002},
- issn = {2329-9304},
- url = {https://www.merl.com/publications/TR2017-150}
- }
- Ochiai, T., Watanabe, S., Hori, T., Hershey, J.R., "Multichannel End-to-end Speech Recognition", International Conference on Machine Learning (ICML), August 2017.
BibTeX TR2017-107 PDF- @inproceedings{Ochiai2017aug,
- author = {Ochiai, Tsubasa and Watanabe, Shinji and Hori, Takaaki and Hershey, John R.},
- title = {Multichannel End-to-end Speech Recognition},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2017,
- month = aug,
- url = {https://www.merl.com/publications/TR2017-107}
- }
- Hori, T., Watanabe, S., Hershey, J.R., "Joint CTC/attention decoding for end-to-end speech recognition", Association for Computational Linguistics (ACL), DOI: 10.18653/v1/P17-1048, July 2017, pp. 518-529.
BibTeX TR2017-103 PDF Video- @inproceedings{Hori2017jul,
- author = {Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
- title = {Joint CTC/attention decoding for end-to-end speech recognition},
- booktitle = {Association for Computational Linguistics (ACL)},
- year = 2017,
- pages = {518--529},
- month = jul,
- doi = {10.18653/v1/P17-1048},
- url = {https://www.merl.com/publications/TR2017-103}
- }
- Chen, S., Tian, D., Feng, C., Vetro, A., Kovacevic, J., "Contour-Enhanced Resampling of 3D Point Clouds Via Graphs", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-017 PDF- @inproceedings{Chen2017mar,
- author = {Chen, Siheng and Tian, Dong and Feng, Chen and Vetro, Anthony and Kovacevic, Jelena},
- title = {Contour-Enhanced Resampling of 3D Point Clouds Via Graphs},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-017}
- }
- Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "BLSTM-HMM Hybrid System Combined with Sound Activity Detection Network for Polyphonic Sound Event Detection", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-014 PDF- @inproceedings{Hayashi2017mar,
- author = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and Le Roux, Jonathan and Takeda, Kazuya},
- title = {BLSTM-HMM Hybrid System Combined with Sound Activity Detection Network for Polyphonic Sound Event Detection},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-014}
- }
- Kao, J.-Y., Tian, D., Mansour, H., Ortega, A., Vetro, A., "Disc-Glasso: Discriminative Graph Learning with Sparsity Regularization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-018 PDF- @inproceedings{Kao2017mar,
- author = {Kao, Jiun-Yu and Tian, Dong and Mansour, Hassan and Ortega, Antonio and Vetro, Anthony},
- title = {Disc-Glasso: Discriminative Graph Learning with Sparsity Regularization},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-018}
- }
- Kim, S., Hori, T., Watanabe, S., "Joint CTC-Attention Based End-to-End Speech Recognition Using Multi-task Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-016 PDF Video- @inproceedings{Kim2017mar,
- author = {Kim, Suyoun and Hori, Takaaki and Watanabe, Shinji},
- title = {Joint CTC-Attention Based End-to-End Speech Recognition Using Multi-task Learning},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-016}
- }
- Li, Q., Liu, S., Mansour, H., Wakin, M., Yang, D., Zhu, Z., "Jazz: A Companion to Music for Frequency Estimation with Missing Data", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-013 PDF- @inproceedings{Li2017mar,
- author = {Li, Qiuwei and Liu, Shuang and Mansour, Hassan and Wakin, Michael and Yang, Dehui and Zhu, Zhihui},
- title = {Jazz: A Companion to Music for Frequency Estimation with Missing Data},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-013}
- }
- Liu, H.-Y., Kamilov, U., Liu, D., Mansour, H., Boufounos, P.T., "Compressive Imaging with Iterative Forward Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-009 PDF- @inproceedings{Liu2017mar2,
- author = {Liu, Hsiou-Yuan and Kamilov, Ulugbek and Liu, Dehong and Mansour, Hassan and Boufounos, Petros T.},
- title = {Compressive Imaging with Iterative Forward Models},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-009}
- }
- Luo, Y., Chen, Z., Hershey, J.R., Le Roux, J., Mesgarani, N., "Deep Clustering and Conventional Networks for Music Separation: Strong Together", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-010 PDF- @inproceedings{Luo2017mar,
- author = {Luo, Yi and Chen, Zhuo and Hershey, John R. and Le Roux, Jonathan and Mesgarani, Nima},
- title = {Deep Clustering and Conventional Networks for Music Separation: Strong Together},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-010}
- }
- Meng, Z., Watanabe, S., Hershey, J.R., Erdogan, H., "Deep Long Short-Term Memory Adaptive Beamforming Networks for Multichannel Robust Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-012 PDF- @inproceedings{Meng2017mar,
- author = {Meng, Zhong and Watanabe, Shinji and Hershey, John R. and Erdogan, Hakan},
- title = {Deep Long Short-Term Memory Adaptive Beamforming Networks for Multichannel Robust Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-012}
- }
- Wang, Y., Raval, N.J., Ishwar, P., Hattori, M., Hirano, T., Matsuda, N., Shimizu, R., "On Methods for Privacy-Preserving Energy Disaggregation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-015 PDF- @inproceedings{Wang2017mar2,
- author = {Wang, Ye and Raval, Nisarg J. and Ishwar, Prakash and Hattori, Mitsuhiro and Hirano, Takato and Matsuda, Nori and Shimizu, Rina},
- title = {On Methods for Privacy-Preserving Energy Disaggregation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-015}
- }
- Watanabe, S., Hori, T., Le Roux, J., Hershey, J.R., "Student-Teacher Network Learning with Enhanced Features", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-011 PDF- @inproceedings{Watanabe2017mar,
- author = {Watanabe, Shinji and Hori, Takaaki and Le Roux, Jonathan and Hershey, John R.},
- title = {Student-Teacher Network Learning with Enhanced Features},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2017,
- month = mar,
- url = {https://www.merl.com/publications/TR2017-011}
- }
- Xiao, X., Watanabe, S., Chng, E.S., Li, H., "Beamforming Networks Using Spatial Covariance Features for Far-field Speech Recognition", Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC), DOI: 10.1109/APSIPA.2016.7820724, December 2016.
BibTeX TR2016-162 PDF- @inproceedings{Xiao2016dec,
- author = {Xiao, Xiong and Watanabe, Shinji and Chng, Eng Siong and Li, Haizhou},
- title = {Beamforming Networks Using Spatial Covariance Features for Far-field Speech Recognition},
- booktitle = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
- year = 2016,
- month = dec,
- doi = {10.1109/APSIPA.2016.7820724},
- url = {https://www.merl.com/publications/TR2016-162}
- }
- Takano, T., Moriya, T., Shinozaki, T., Watanabe, S., Hori, T., Duh, K., "Automated Structure Discovery and Parameter Tuning of Neural Network Language Model Based on Evolution Strategy", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/SLT.2016.7846334, December 2016.
BibTeX TR2016-173 PDF- @inproceedings{Takano2016dec,
- author = {Takano, Tomihiro and Moriya, Takafumi and Shinozaki, Takahiro and Watanabe, Shinji and Hori, Takaaki and Duh, Kevin},
- title = {Automated Structure Discovery and Parameter Tuning of Neural Network Language Model Based on Evolution Strategy},
- booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
- year = 2016,
- month = dec,
- doi = {10.1109/SLT.2016.7846334},
- url = {https://www.merl.com/publications/TR2016-173}
- }
- Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The Third 'CHIME' Speech Separation and Recognition Challenge: Analysis and Outcomes", Computer Speech & Language, DOI: 10.1016/j.csl.2016.10.005, December 2016.
BibTeX TR2016-171 PDF- @article{Barker2016dec,
- author = {Barker, Jon and Marxer, Ricard and Vincent, Emmanuel and Watanabe, Shinji},
- title = {The Third 'CHIME' Speech Separation and Recognition Challenge: Analysis and Outcomes},
- journal = {Computer Speech \& Language},
- year = 2016,
- month = dec,
- publisher = {Elsevier},
- doi = {10.1016/j.csl.2016.10.005},
- url = {https://www.merl.com/publications/TR2016-171}
- }
- Vincent, E., Watanabe, S., Nugraha, A.A., Barker, J., Marxer, R., "An analysis of environment, microphone and data simulation mismatches in robust speech recognition", Computer Speech & Language, DOI: 10.1016/j.csl.2016.11.005, December 2016.
BibTeX TR2016-172 PDF- @article{Vincent2016dec,
- author = {Vincent, Emmanuel and Watanabe, Shinji and Nugraha, Aditya Arie and Barker, Jon and Marxer, Ricard},
- title = {An analysis of environment, microphone and data simulation mismatches in robust speech recognition},
- journal = {Computer Speech \& Language},
- year = 2016,
- month = dec,
- publisher = {Elsevier},
- doi = {10.1016/j.csl.2016.11.005},
- url = {https://www.merl.com/publications/TR2016-172}
- }
- Delcroix, M., Watanabe, S., "Recent Advances in Distant Speech Recognition," Tech. Rep. TR2016-115, Interspeech Tutorials, September 2016.
BibTeX TR2016-115 PDF- @techreport{Delcroix2016sep,
- author = {Delcroix, Marc and Watanabe, Shinji},
- title = {Recent Advances in Distant Speech Recognition},
- booktitle = {Interspeech Tutorials},
- institution = {Interspeech},
- year = 2016,
- month = sep,
- url = {https://www.merl.com/publications/TR2016-115}
- }
- Le Roux, J., Vincent, E., Erdogan, H., "Learning-Based Approaches to Speech Enhancement and Separation," Tech. Rep. TR2016-113, Interspeech Tutorials, September 2016.
BibTeX TR2016-113 PDF- @techreport{LeRoux2016sep,
- author = {Le Roux, Jonathan and Vincent, Emmanuel and Erdogan, Hakan},
- title = {Learning-Based Approaches to Speech Enhancement and Separation},
- booktitle = {Interspeech Tutorials},
- institution = {Interspeech},
- year = 2016,
- month = sep,
- url = {https://www.merl.com/publications/TR2016-113}
- }
- Erdogan, H., Hershey, J.R., Watanabe, S., Mandel, M., Le Roux, J., "Improved MVDR beamforming using single-channel mask prediction networks", Interspeech, DOI: 10.21437/Interspeech.2016-552, September 2016, pp. 1981-1985.
BibTeX TR2016-072 PDF- @inproceedings{Erdogan2016sep,
- author = {Erdogan, Hakan and Hershey, John R. and Watanabe, Shinji and Mandel, Michael and Le Roux, Jonathan},
- title = {Improved MVDR beamforming using single-channel mask prediction networks},
- booktitle = {Interspeech},
- year = 2016,
- pages = {1981--1985},
- month = sep,
- doi = {10.21437/Interspeech.2016-552},
- url = {https://www.merl.com/publications/TR2016-072}
- }
- Isik, Y., Le Roux, J., Chen, Z., Watanabe, S., Hershey, J.R., "Single-Channel Multi-Speaker Separation using Deep Clustering", Interspeech, DOI: 10.21437/Interspeech.2016-1176, September 2016, pp. 545-549.
BibTeX TR2016-073 PDF- @inproceedings{Isik2016sep,
- author = {Isik, Yusuf and Le Roux, Jonathan and Chen, Zhuo and Watanabe, Shinji and Hershey, John R.},
- title = {Single-Channel Multi-Speaker Separation using Deep Clustering},
- booktitle = {Interspeech},
- year = 2016,
- pages = {545--549},
- month = sep,
- doi = {10.21437/Interspeech.2016-1176},
- url = {https://www.merl.com/publications/TR2016-073}
- }
- Zmolikova, K., Karafiat, M., Vesely, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J.H., "Data selection by sequence summarizing neural network in mismatch condition training", Interspeech, DOI: 10.21437/Interspeech.2016-741, September 2016, pp. 2354-2358.
BibTeX TR2016-075 PDF- @inproceedings{Zmolikova2016sep,
- author = {Zmolikova, Katerina and Karafiat, Martin and Vesely, Karel and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan Honza},
- title = {Data selection by sequence summarizing neural network in mismatch condition training},
- booktitle = {Interspeech},
- year = 2016,
- pages = {2354--2358},
- month = sep,
- doi = {10.21437/Interspeech.2016-741},
- url = {https://www.merl.com/publications/TR2016-075}
- }
- Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), September 2016, pp. 35-39.
BibTeX TR2016-114 PDF- @inproceedings{Hayashi2016sep,
- author = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and Le Roux, Jonathan and Takeda, Kazuya},
- title = {Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection},
- booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
- year = 2016,
- pages = {35--39},
- month = sep,
- url = {https://www.merl.com/publications/TR2016-114}
- }
- Castorena, J., Kamilov, U., Boufounos, P.T., "Autocalibration of LIDAR and Optical Cameras via Edge Alignment", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472200, March 2016, pp. 2862-2866.
BibTeX TR2016-009 PDF- @inproceedings{Castorena2016mar,
- author = {Castorena, Juan and Kamilov, Ulugbek and Boufounos, Petros T.},
- title = {Autocalibration of LIDAR and Optical Cameras via Edge Alignment},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2016,
- pages = {2862--2866},
- month = mar,
- doi = {10.1109/ICASSP.2016.7472200},
- url = {https://www.merl.com/publications/TR2016-009}
- }