- Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition", Interspeech, September 2014, vol. 15, pp. 2415-2419.
BibTeX TR2014-079 PDF- @inproceedings{Tachioka2014sep,
- author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition}},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {2415--2419},
- month = sep,
- publisher = {International Speech Communication Association},
- issn = {2308-457X},
- url = {https://www.merl.com/publications/TR2014-079}
- }
- Watanabe, S., Hershey, J.R., Marks, T.K., Fujii, Y., Koji, Y., "Cost-level integration of statistical and rule-based dialog managers", Interspeech, September 2014, vol. 15, pp. 323-327.
BibTeX TR2014-082 PDF- @inproceedings{Watanabe2014sep,
- author = {Watanabe, S. and Hershey, J.R. and Marks, T.K. and Fujii, Y. and Koji, Y.},
- title = {{Cost-level integration of statistical and rule-based dialog managers}},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {323--327},
- month = sep,
- publisher = {International Speech Communication Association},
- url = {https://www.merl.com/publications/TR2014-082}
- }
- Weninger, F., Le Roux, J., Hershey, J.R., Watanabe, S., "Discriminative NMF and its application to single-channel source separation", Interspeech, September 2014, vol. 15, pp. 865-869.
BibTeX TR2014-081 PDF- @inproceedings{Weninger2014sep,
- author = {Weninger, F. and {Le Roux}, J. and Hershey, J.R. and Watanabe, S.},
- title = {{Discriminative NMF and its application to single-channel source separation}},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {865--869},
- month = sep,
- publisher = {International Speech Communication Association},
- issn = {2308-457X},
- url = {https://www.merl.com/publications/TR2014-081}
- }
- Hershey, J.R., Le Roux, J., Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures", arXiv, August 2014.
BibTeX arXiv- @article{Hershey2014aug,
- author = {Hershey, J.R. and {Le Roux}, J. and Weninger, F.},
- title = {{Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures}},
- journal = {arXiv},
- year = 2014,
- month = aug,
- url = {https://arxiv.org/abs/1409.2574}
- }
- Weninger, F., Watanabe, S., Le Roux, J., Hershey, J.R., Tachioka, Y., Geiger, J., Schuller, B., Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-033 PDF- @inproceedings{Weninger2014may2,
- author = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
- title = {{The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement}},
- booktitle = {IEEE REVERB Workshop},
- year = 2014,
- month = may,
- url = {https://www.merl.com/publications/TR2014-033}
- }
- Simsekli, U., Le Roux, J., Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
BibTeX TR2014-027 PDF Software- @inproceedings{Simsekli2014may,
- author = {Simsekli, U. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Non-negative Source-filter Dynamical System for Speech Enhancement}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {6206--6210},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854797},
- url = {https://www.merl.com/publications/TR2014-027}
- }
- Tang, H., Watanabe, S., Marks, T.K., Hershey, J.R., "Log-linear Dialog Manager", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854371, May 2014, pp. 4092-4096.
BibTeX TR2014-024 PDF- @inproceedings{Tang2014may,
- author = {Tang, H. and Watanabe, S. and Marks, T.K. and Hershey, J.R.},
- title = {{Log-linear Dialog Manager}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {4092--4096},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854371},
- url = {https://www.merl.com/publications/TR2014-024}
- }
- Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "A Generalized Discriminative Training Framework for System Combination", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2013.6707703, December 2013, pp. 43-48.
BibTeX TR2013-118 PDF- @inproceedings{Tachioka2013dec,
- author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
- title = {{A Generalized Discriminative Training Framework for System Combination}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2013,
- pages = {43--48},
- month = dec,
- doi = {10.1109/ASRU.2013.6707703},
- url = {https://www.merl.com/publications/TR2013-118}
- }
- Potluru, V.K., Le Roux, J., Pearlmutter, B.A., Hershey, J.R., Brand, M., "Coordinate Descent for Mixed-norm NMF", NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective, December 2013.
BibTeX TR2013-130 PDF- @inproceedings{Potluru2013dec,
- author = {Potluru, V.K. and {Le Roux}, J. and Pearlmutter, B.A. and Hershey, J.R. and Brand, M.},
- title = {{Coordinate Descent for Mixed-norm NMF}},
- booktitle = {NIPS Workshop on Greedy Algorithms, Frank-Wolfe and Friends - A Modern Perspective},
- year = 2013,
- month = dec,
- url = {https://www.merl.com/publications/TR2013-130}
- }
- Le Roux, J., Watanabe, S., Hershey, J.R., "Ensemble Learning for Speech Enhancement", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701888, October 2013, pp. 1-4.
BibTeX TR2013-098 PDF- @inproceedings{LeRoux2013oct,
- author = {{Le Roux}, J. and Watanabe, S. and Hershey, J.R.},
- title = {{Ensemble Learning for Speech Enhancement}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2013,
- pages = {1--4},
- month = oct,
- doi = {10.1109/WASPAA.2013.6701888},
- issn = {1931-1168},
- url = {https://www.merl.com/publications/TR2013-098}
- }
- Simsekli, U., Le Roux, J., Hershey, J.R., "Hierarchical and Coupled Non-negative Dynamical Systems with Application to Audio Modeling", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA.2013.6701891, October 2013, pp. 1-4.
BibTeX TR2013-097 PDF- @inproceedings{Simsekli2013oct,
- author = {Simsekli, U. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Hierarchical and Coupled Non-negative Dynamical Systems with Application to Audio Modeling}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2013,
- pages = {1--4},
- month = oct,
- doi = {10.1109/WASPAA.2013.6701891},
- issn = {1931-1168},
- url = {https://www.merl.com/publications/TR2013-097}
- }
- Yoshino, K., Watanabe, S., Le Roux, J., Hershey, J.R., "Statistical Dialogue Management using Intention Dependency Graph", International Joint Conference on Natural Language Processing (IJCNLP), October 2013.
BibTeX TR2013-096 PDF- @inproceedings{Yoshino2013oct,
- author = {Yoshino, K. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Statistical Dialogue Management using Intention Dependency Graph}},
- booktitle = {International Joint Conference on Natural Language Processing (IJCNLP)},
- year = 2013,
- month = oct,
- url = {https://www.merl.com/publications/TR2013-096}
- }
- Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Discriminative Methods for Noise Robust Speech Recognition: A CHiME Challenge Benchmark", International Workshop on Machine Listening in Multisource Environments (CHiME), June 2013.
BibTeX TR2013-044 PDF- @inproceedings{Tachioka2013jun,
- author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Discriminative Methods for Noise Robust Speech Recognition: A CHiME Challenge Benchmark}},
- booktitle = {International Workshop on Machine Listening in Multisource Environments (CHiME)},
- year = 2013,
- month = jun,
- url = {https://www.merl.com/publications/TR2013-044}
- }
- Fevotte, C., Le Roux, J., Hershey, J.R., "Non-negative Dynamical System with Application to Speech and Audio", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
BibTeX TR2013-021 PDF Software- @inproceedings{Fevotte2013may,
- author = {Fevotte, C. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Non-negative Dynamical System with Application to Speech and Audio}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- month = may,
- url = {https://www.merl.com/publications/TR2013-021}
- }
- Le Roux, J., Boufounos, P.T., Kang, K., Hershey, J.R., "Source Localization in Reverberant Environments using Sparse Optimization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6638473, May 2013, pp. 4310-4314.
BibTeX TR2013-022 PDF- @inproceedings{LeRoux2013may,
- author = {{Le Roux}, J. and Boufounos, P.T. and Kang, K. and Hershey, J.R.},
- title = {{Source Localization in Reverberant Environments using Sparse Optimization}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- pages = {4310--4314},
- month = may,
- doi = {10.1109/ICASSP.2013.6638473},
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2013-022}
- }
- Tachioka, Y., Watanabe, S., Hershey, J.R., "Effectiveness of Discriminative Training and Feature Transformation for Reverberated and Noisy Speech", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2013.
BibTeX TR2013-020 PDF- @inproceedings{Tachioka2013may,
- author = {Tachioka, Y. and Watanabe, S. and Hershey, J.R.},
- title = {{Effectiveness of Discriminative Training and Feature Transformation for Reverberated and Noisy Speech}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- month = may,
- url = {https://www.merl.com/publications/TR2013-020}
- }
- Watanabe, S., Hershey, J.R., "Stereo-based Feature Enhancement Using Dictionary Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2013.6639034, May 2013, pp. 7073-7077.
BibTeX TR2013-019 PDF- @inproceedings{Watanabe2013may,
- author = {Watanabe, S. and Hershey, J.R.},
- title = {{Stereo-based Feature Enhancement Using Dictionary Learning}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2013,
- pages = {7073--7077},
- month = may,
- doi = {10.1109/ICASSP.2013.6639034},
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2013-019}
- }
- Hershey, J.R., Rennie, S.J., Le Roux, J., "Factorial Models for Noise Robust Speech Recognition" in Techniques for Noise Robustness in Automatic Speech Recognition, Virtanen, T. and Singh, R. and Raj, B., Eds., chapter 12, Wiley, November 2012.
BibTeX TR2012-002 PDF- @incollection{Hershey2012nov,
- author = {Hershey, J.R. and Rennie, S.J. and {Le Roux}, J.},
- title = {{Factorial Models for Noise Robust Speech Recognition}},
- booktitle = {Techniques for Noise Robustness in Automatic Speech Recognition},
- year = 2012,
- editor = {Virtanen, T. and Singh, R. and Raj, B.},
- chapter = 12,
- month = nov,
- publisher = {Wiley},
- url = {https://www.merl.com/publications/TR2012-002}
- }
- Heaukulani, C., Le Roux, J., Hershey, J.R., "Latent Dirichlet Reallocation for Term Swapping", International Workshop on Statistical Machine Learning for Speech Processing (IWSML), March 2012.
BibTeX TR2012-022 PDF- @inproceedings{Heaukulani2012mar,
- author = {Heaukulani, C. and {Le Roux}, J. and Hershey, J.R.},
- title = {{Latent Dirichlet Reallocation for Term Swapping}},
- booktitle = {International Workshop on Statistical Machine Learning for Speech Processing (IWSML)},
- year = 2012,
- month = mar,
- url = {https://www.merl.com/publications/TR2012-022}
- }
- Le Roux, J., Hershey, J.R., "Indirect Model-based Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2012.6288806, March 2012, pp. 4045-4048.
BibTeX TR2012-016 PDF- @inproceedings{LeRoux2012mar2,
- author = {{Le Roux}, J. and Hershey, J.R.},
- title = {{Indirect Model-based Speech Enhancement}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2012,
- pages = {4045--4048},
- month = mar,
- doi = {10.1109/ICASSP.2012.6288806},
- issn = {1520-6149},
- isbn = {978-1-4673-0045-2},
- url = {https://www.merl.com/publications/TR2012-016}
- }
- Le Roux, J., Hershey, J.R., "Speech Enhancement by Indirect VTS", Acoustical Society of Japan Spring Meeting (ASJ), March 2012.
BibTeX TR2012-011 PDF- @inproceedings{LeRoux2012mar1,
- author = {{Le Roux}, J. and Hershey, J.R.},
- title = {{Speech Enhancement by Indirect VTS}},
- booktitle = {Acoustical Society of Japan Spring Meeting (ASJ)},
- year = 2012,
- month = mar,
- url = {https://www.merl.com/publications/TR2012-011}
- }
- Taguchi, Y., Marks, T.K., Hershey, J.R., "Entropy-Based Motion Selection for Touch-Based Registration Using Rao-Blackwellized Particle Filtering", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS.2011.6094767, September 2011, pp. 4690-4697.
BibTeX TR2011-067 PDF- @inproceedings{Taguchi2011sep,
- author = {Taguchi, Y. and Marks, T.K. and Hershey, J.R.},
- title = {{Entropy-Based Motion Selection for Touch-Based Registration Using Rao-Blackwellized Particle Filtering}},
- booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
- year = 2011,
- pages = {4690--4697},
- month = sep,
- doi = {10.1109/IROS.2011.6094767},
- url = {https://www.merl.com/publications/TR2011-067}
- }
- Marks, T.K., Hershey, J.R., Movellan, J.R., "Tracking Motion, Deformation, and Texture Using Conditionally Gaussian Processes", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2008.278, Vol. 32, No. 2, pp. 348-363, February 2010.
BibTeX TR2010-071 PDF- @article{Marks2010feb,
- author = {Marks, T.K. and Hershey, J.R. and Movellan, J.R.},
- title = {{Tracking Motion, Deformation, and Texture Using Conditionally Gaussian Processes}},
- journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
- year = 2010,
- volume = 32,
- number = 2,
- pages = {348--363},
- month = feb,
- doi = {10.1109/TPAMI.2008.278},
- url = {https://www.merl.com/publications/TR2010-071}
- }