Publications

d’Haro, L.F., Banchs, R., Hori, C., Li, H., "Automatic Evaluation of End-to-End Dialog Systems with Adequacy-Fluency Metrics", Special issue on DSTC6 in Computer Speech and Language, DOI: 10.1016/j.csl.2018.12.004, Vol. 55, pp. 200-215, March 2019.
BibTeX TR2018-195 PDF
- @article{dHaro2019mar,
- author = {d'Haro, Luis Fernando and Banchs, Rafael and Hori, Chiori and Li, Haizhou},
- title = {{Automatic Evaluation of End-to-End Dialog Systems with Adequacy-Fluency Metrics}},
- journal = {Special issue on DSTC6 in Computer Speech and Language},
- year = 2019,
- volume = 55,
- pages = {200--215},
- month = mar,
- publisher = {Elsevier},
- doi = {10.1016/j.csl.2018.12.004},
- url = {https://www.merl.com/publications/TR2018-195}
- }
Teo, K.H., "Trip Report on International Symposium on the Physical and Failure Analysis of Integrated Circuits 2018 and NTU-MIT Alliance Labs Visit," Tech. Rep. TR2018-194, Mitsubishi Electric Research Laboratories, March 2019.
BibTeX TR2018-194 PDF
- @techreport{Teo2019mar2,
- author = {Teo, Koon Hoo},
- title = {{Trip Report on International Symposium on the Physical and Failure Analysis of Integrated Circuits 2018 and NTU-MIT Alliance Labs Visit}},
- institution = {Mitsubishi Electric Research Laboratories},
- year = 2019,
- month = mar,
- url = {https://www.merl.com/publications/TR2018-194}
- }
TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D.K., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Modeling for Integrated Photonics", Optical Fiber Communication Conference and Exposition and the National Fiber Optic Engineers Conference (OFC/NFOEC), DOI: 10.1364/OFC.2019.W3B.5, March 2019.
BibTeX TR2018-183 PDF
- @inproceedings{TaherSima2019mar,
- author = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh K. and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
- title = {{Deep Neural Network Inverse Modeling for Integrated Photonics}},
- booktitle = {Optical Fiber Communication Conference and Exposition and the National Fiber Optic Engineers Conference (OFC/NFOEC)},
- year = 2019,
- month = mar,
- doi = {10.1364/OFC.2019.W3B.5},
- url = {https://www.merl.com/publications/TR2018-183}
- }
TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Design of Integrated Photonic Power Splitters", Nature Scientific Reports, DOI: 10.1038/s41598-018-37952-2, Vol. 9, pp. 1368, December 2018.
BibTeX TR2018-180 PDF
- @article{TaherSima2018dec,
- author = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
- title = {{Deep Neural Network Inverse Design of Integrated Photonic Power Splitters}},
- journal = {Nature Scientific Reports},
- year = 2018,
- volume = 9,
- pages = 1368,
- month = dec,
- doi = {10.1038/s41598-018-37952-2},
- issn = {2045-2322},
- url = {https://www.merl.com/publications/TR2018-180}
- }
Ataer-Cansizoglu, E., Jones, M.J., "Super-resolution of Very Low-Resolution Faces from Videos", British Machine Vision Conference (BMVC), September 2018.
BibTeX TR2018-140 PDF
- @inproceedings{Ataer-Cansizoglu2018sep,
- author = {Ataer-Cansizoglu, Esra and Jones, Michael J.},
- title = {{Super-resolution of Very Low-Resolution Faces from Videos}},
- booktitle = {British Machine Vision Conference (BMVC)},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-140}
- }
Wichern, G., Le Roux, J., "Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/IWAENC.2018.8521243, September 2018.
BibTeX TR2018-146 PDF
- @inproceedings{Wichern2018sep,
- author = {Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation}},
- booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
- year = 2018,
- month = sep,
- doi = {10.1109/IWAENC.2018.8521243},
- url = {https://www.merl.com/publications/TR2018-146}
- }
Kocanaogullari, A., Ataer-Cansizoglu, E., "Active Descriptor Learning for Feature Matching", International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision, September 2018.
BibTeX TR2018-132 PDF
- @inproceedings{Kocanaogullari2018sep,
- author = {Kocanaogullari, Aziz and Ataer-Cansizoglu, Esra},
- title = {{Active Descriptor Learning for Feature Matching}},
- booktitle = {International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-132}
- }
Jones, M.J., Broad, A., Lee, T.-Y., "Recurrent Multi-frame Single Shot Detector for Video Object Detection", British Machine Vision Conference (BMVC), September 2018.
BibTeX TR2018-137 PDF
- @inproceedings{Jones2018sep,
- author = {Jones, Michael J. and Broad, Alexander and Lee, Teng-Yok},
- title = {{Recurrent Multi-frame Single Shot Detector for Video Object Detection}},
- booktitle = {British Machine Vision Conference (BMVC)},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-137}
- }
Wang, Z.-Q., Le Roux, J., Wang, D., Hershey, J., "End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction", Interspeech, September 2018.
BibTeX TR2018-135 PDF
- @inproceedings{Wang2018sep,
- author = {Wang, Zhong-Qiu and {Le Roux}, Jonathan and Wang, DeLiang and Hershey, John},
- title = {{End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction}},
- booktitle = {Interspeech},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-135}
- }
Watanabe, S., Hori, T., Karita, S., Hayashi, T., Nishitoba, J., Unno, Y., Enrique Yalta Soplin, N., Heymann, J., Wiesner, M., Chen, N., Renduchintala, A., Ochiai, T., "ESPnet: End-to-End Speech Processing Toolkit", Interspeech, September 2018.
BibTeX TR2018-136 PDF
- @inproceedings{Watanabe2018sep,
- author = {Watanabe, Shinji and Hori, Takaaki and Karita, Shigeki and Hayashi, Tomoki and Nishitoba, Jiro and Unno, Yuya and Enrique Yalta Soplin, Nelson and Heymann, Jahn and Wiesner, Matthew and Chen, Nanxin and Renduchintala, Adithya and Ochiai, Tsubasa},
- title = {{ESPnet: End-to-End Speech Processing Toolkit}},
- booktitle = {Interspeech},
- year = 2018,
- month = sep,
- url = {https://www.merl.com/publications/TR2018-136}
- }
Ataer-Cansizoglu, E., Jones, M.J., Zhang, Z., Sullivan, A., "Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network", arXiv, August 2018.
BibTeX arXiv
- @article{Ataer-Cansizoglu2018aug,
- author = {Ataer-Cansizoglu, Esra and Jones, Michael J. and Zhang, Ziming and Sullivan, Alan},
- title = {{Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network}},
- journal = {arXiv},
- year = 2018,
- month = aug,
- url = {https://arxiv.org/abs/1903.10974}
- }
Zhang, Z., "LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks", arXiv, July 12, 2018.
BibTeX arXiv
- @article{Zhang2018jul,
- author = {Zhang, Ziming},
- title = {{LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks}},
- journal = {arXiv},
- year = 2018,
- month = jul,
- url = {https://arxiv.org/abs/1805.08656}
- }
Erdogan, H., Hershey, J., Watanabe, S., Le Roux, J., "Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., and Hershey, J.R., Eds., chapter 7, Springer, July 2018.
BibTeX
- @incollection{Erdogan2018jul,
- author = {Erdogan, Hakan and Hershey, John and Watanabe, Shinji and {Le Roux}, Jonathan},
- title = {{Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio}},
- booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
- year = 2018,
- editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
- chapter = 7,
- month = jul,
- publisher = {Springer},
- isbn = {978-3-319-64680-0}
- }
Xiao, X., Watanabe, S., Erdogan, H., Mandel, M., Lu, L., Hershey, J., Seltzer, M., Chen, G., Zhang, Y., Yu, D., "Discriminative beamforming with phase aware neural networks for speech enhancement and recognition" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S., Delcroix, M., Metze, F., and Hershey, J.R., Eds., chapter 4, Springer, July 9, 2018.
BibTeX
- @incollection{Xiao2018jul2,
- author = {Xiao, Xiong and Watanabe, Shinji and Erdogan, Hakan and Mandel, Michael and Lu, Liang and Hershey, John and Seltzer, Mike and Chen, Guoguo and Zhang, Yu and Yu, Dong},
- title = {{Discriminative beamforming with phase aware neural networks for speech enhancement and recognition}},
- booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
- year = 2018,
- editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
- chapter = 4,
- month = jul,
- publisher = {Springer}
- }
Liu, J., Guo, J., Orlik, P.V., Shibata, M., Nakahara, D., Mii, S., Takac, M., "Anomaly Detection in Manufacturing Systems Using Structured Neural Networks", IEEE World Congress on Intelligent Control and Automation, DOI: 10.1109/WCICA.2018.8630692, July 2018, pp. 175-180.
BibTeX TR2018-097 PDF
- @inproceedings{Liu2018jul2,
- author = {Liu, Jie and Guo, Jianlin and Orlik, Philip V. and Shibata, Masahiko and Nakahara, Daiki and Mii, Satoshi and Takac, Martin},
- title = {{Anomaly Detection in Manufacturing Systems Using Structured Neural Networks}},
- booktitle = {IEEE World Congress on Intelligent Control and Automation},
- year = 2018,
- pages = {175--180},
- month = jul,
- doi = {10.1109/WCICA.2018.8630692},
- url = {https://www.merl.com/publications/TR2018-097}
- }
Koike-Akino, T., Millar, D.S., Parsons, K., Kojima, K., "Fiber Nonlinearity Equalization with Multi-Label Deep Learning Scalable to High-Order DP-QAM", Signal Processing in Photonic Communications (SPPCom), DOI: 10.1364/SPPCOM.2018.SpM4G.1, July 2018.
BibTeX TR2018-047 PDF
- @inproceedings{Koike-Akino2018jul3,
- author = {Koike-Akino, Toshiaki and Millar, David S. and Parsons, Kieran and Kojima, Keisuke},
- title = {{Fiber Nonlinearity Equalization with Multi-Label Deep Learning Scalable to High-Order DP-QAM}},
- booktitle = {Signal Processing in Photonic Communications (SPPCom)},
- year = 2018,
- month = jul,
- doi = {10.1364/SPPCOM.2018.SpM4G.1},
- url = {https://www.merl.com/publications/TR2018-047}
- }
Shen, Y., Feng, C., Yang, Y., Tian, D., "Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018.
BibTeX TR2018-041 PDF Software
- @inproceedings{Shen2018jun,
- author = {Shen, Yiru and Feng, Chen and Yang, Yaoqing and Tian, Dong},
- title = {{Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2018,
- month = jun,
- url = {https://www.merl.com/publications/TR2018-041}
- }
Yang, Y., Feng, C., Shen, Y., Tian, D., "FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2018.00029, June 2018.
BibTeX TR2018-042 PDF Video Software
- @inproceedings{Yang2018jun,
- author = {Yang, Yaoqing and Feng, Chen and Shen, Yiru and Tian, Dong},
- title = {{FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2018,
- month = jun,
- doi = {10.1109/CVPR.2018.00029},
- url = {https://www.merl.com/publications/TR2018-042}
- }
Fujihashi, T., Koike-Akino, T., Watanabe, T., Orlik, P.V., "Nonlinear Equalization with Deep Learning for Multi-Purpose Visual MIMO Communications", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC.2018.8422544, May 2018.
BibTeX TR2018-039 PDF
- @inproceedings{Fujihashi2018may,
- author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi and Orlik, Philip V.},
- title = {{Nonlinear Equalization with Deep Learning for Multi-Purpose Visual MIMO Communications}},
- booktitle = {IEEE International Conference on Communications (ICC)},
- year = 2018,
- month = may,
- doi = {10.1109/ICC.2018.8422544},
- url = {https://www.merl.com/publications/TR2018-039}
- }
Ochiai, T., Watanabe, S., Katagiri, S., Hori, T., Hershey, J.R., "Speaker Adaptation for Multichannel End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462161, April 2018, pp. 6707-6711.
BibTeX TR2018-006 PDF
- @inproceedings{Ochiai2018apr,
- author = {Ochiai, Tsubasa and Watanabe, Shinji and Katagiri, Shigeru and Hori, Takaaki and Hershey, John R.},
- title = {{Speaker Adaptation for Multichannel End-to-End Speech Recognition}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {6707--6711},
- month = apr,
- doi = {10.1109/ICASSP.2018.8462161},
- url = {https://www.merl.com/publications/TR2018-006}
- }
Settle, S., Le Roux, J., Hori, T., Watanabe, S., Hershey, J.R., "End-to-End Multi-Speaker Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8461893, April 2018, pp. 4819-4823.
BibTeX TR2018-001 PDF Video
- @inproceedings{Settle2018apr,
- author = {Settle, Shane and {Le Roux}, Jonathan and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
- title = {{End-to-End Multi-Speaker Speech Recognition}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {4819--4823},
- month = apr,
- doi = {10.1109/ICASSP.2018.8461893},
- url = {https://www.merl.com/publications/TR2018-001}
- }
Wang, Z.-Q., Le Roux, J., Hershey, J.R., "Alternative Objective Functions for Deep Clustering", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462507, April 2018, pp. 686-690.
BibTeX TR2018-005 PDF
- @inproceedings{Wang2018apr,
- author = {Wang, Zhong-Qiu and {Le Roux}, Jonathan and Hershey, John R.},
- title = {{Alternative Objective Functions for Deep Clustering}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {686--690},
- month = apr,
- doi = {10.1109/ICASSP.2018.8462507},
- url = {https://www.merl.com/publications/TR2018-005}
- }
Wen, B., Kamilov, U., Liu, D., Mansour, H., Boufounos, P.T., "DeepCASD: An End-to-End Approach for Multi-Spectral Image Super-Resolution", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8461795, April 2018, pp. 6503-6507.
BibTeX TR2018-009 PDF
- @inproceedings{Wen2018apr,
- author = {Wen, Bihan and Kamilov, Ulugbek and Liu, Dehong and Mansour, Hassan and Boufounos, Petros T.},
- title = {{DeepCASD: An End-to-End Approach for Multi-Spectral Image Super-Resolution}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {6503--6507},
- month = apr,
- doi = {10.1109/ICASSP.2018.8461795},
- url = {https://www.merl.com/publications/TR2018-009}
- }
Zhang, Z., Brand, M., "Convergent Block Coordinate Descent for Training Tikhonov Regularized Deep Neural Networks", Advances in Neural Information Processing Systems (NIPS), December 2017.
BibTeX TR2017-140 PDF
- @inproceedings{Ziming2017dec,
- author = {Zhang, Ziming and Brand, Matthew},
- title = {{Convergent Block Coordinate Descent for Training Tikhonov Regularized Deep Neural Networks}},
- booktitle = {Advances in Neural Information Processing Systems (NIPS)},
- year = 2017,
- month = dec,
- url = {https://www.merl.com/publications/TR2017-140}
- }
Ochiai, T., Watanabe, S., Hori, T., Hershey, J.R., Xiao, X., "Unified Architecture for Multichannel End-to-End Speech Recognition with Neural Beamforming", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2017.2764276, Vol. 11, No. 8, pp. 1274-1288, October 2017.
BibTeX TR2017-192 PDF
- @article{Ochiai2017oct2,
- author = {Ochiai, Tsubasa and Watanabe, Shinji and Hori, Takaaki and Hershey, John R. and Xiao, Xiong},
- title = {{Unified Architecture for Multichannel End-to-End Speech Recognition with Neural Beamforming}},
- journal = {IEEE Journal of Selected Topics in Signal Processing},
- year = 2017,
- volume = 11,
- number = 8,
- pages = {1274--1288},
- month = oct,
- doi = {10.1109/JSTSP.2017.2764276},
- issn = {1941-0484},
- url = {https://www.merl.com/publications/TR2017-192}
- }