Publications

359 / 3,667 publications found.


  •  Smaragdis, P., "Exploiting Redundancy to Construct Listening Systems", Perspectives on Speech Separation, July 2004.
    BibTeX SpringerLink
    • @inproceedings{Smaragdis2004jul,
    • author = {Smaragdis, P.},
    • title = {Exploiting Redundancy to Construct Listening Systems},
    • booktitle = {Perspectives on Speech Separation},
    • year = 2004,
    • month = jul,
    • url = {https://link.springer.com/chapter/10.1007/0-387-22794-6_7}
    • }
  •  Raj, B., Singh, R., Stern, R.M., "On Tracking Noise with Linear Dynamical System Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2004, vol. 1, pp. 965-968.
    BibTeX TR2004-042 PDF
    • @inproceedings{Raj2004may,
    • author = {Raj, B. and Singh, R. and Stern, R.M.},
    • title = {On Tracking Noise with Linear Dynamical System Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2004,
    • volume = 1,
    • pages = {965--968},
    • month = may,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2004-042}
    • }
  •  Divi, V., Forlines, C., van Gemert, J.V., Raj, B., Schmidt-Nielsen, B., Wittenburg, K., Woelfel, J., Wolf, P., Zhang, F., "A Speech-In List-Out Approach to Spoken User Interfaces", Human Language Technology Conference (HLT), May 2004.
    BibTeX TR2004-023 PDF
    • @inproceedings{Divi2004may,
    • author = {Divi, V. and Forlines, C. and {van Gemert}, J.V. and Raj, B. and Schmidt-Nielsen, B. and Wittenburg, K. and Woelfel, J. and Wolf, P. and Zhang, F.},
    • title = {A Speech-In List-Out Approach to Spoken User Interfaces},
    • booktitle = {Human Language Technology Conference (HLT)},
    • year = 2004,
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-023}
    • }
  •  Raj, B., Seltzer, M.L., Reyes-Gomez, M.J., "Speech Recognizer Based Maximum Likelihood Beamforming", NSF Workshop on Perspectives on Speech Separation, October 2003.
    BibTeX TR2003-87 PDF
    • @inproceedings{Raj2003oct,
    • author = {Raj, B. and Seltzer, M.L. and Reyes-Gomez, M.J.},
    • title = {Speech Recognizer Based Maximum Likelihood Beamforming},
    • booktitle = {NSF Workshop on Perspectives on Speech Separation},
    • year = 2003,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-87}
    • }
  •  Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 13-16.
    BibTeX TR2003-88 PDF
    • @inproceedings{Reyes-Gomez2003oct,
    • author = {Reyes-Gomez, M.J. and Raj, B. and Ellis, D.P.W.},
    • title = {Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2003,
    • pages = {13--16},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2003-88}
    • }
  •  Peker, K.A., Divakaran, A., "An Extended Framework for Adaptive Playback-Based Video Summarization", SPIE Conference on Internet Multimedia Management Systems, September 2003, vol. 5242, pp. 26-33.
    BibTeX TR2003-115 PDF
    • @inproceedings{Peker2003sep,
    • author = {Peker, K.A. and Divakaran, A.},
    • title = {An Extended Framework for Adaptive Playback-Based Video Summarization},
    • booktitle = {SPIE Conference on Internet Multimedia Management Systems},
    • year = 2003,
    • volume = 5242,
    • pages = {26--33},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2003-115}
    • }
  •  Lamere, P., Kwok, P., Walker, W., Gouvea, E., Singh, R., Raj, B., Wolf, P.P., "Design of the CMU Sphinx-4 Decoder", Eurospeech, September 2003.
    BibTeX TR2003-110 PDF
    • @inproceedings{Lamere2003sep,
    • author = {Lamere, P. and Kwok, P. and Walker, W. and Gouvea, E. and Singh, R. and Raj, B. and Wolf, P.P.},
    • title = {Design of the CMU Sphinx-4 Decoder},
    • booktitle = {Eurospeech},
    • year = 2003,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2003-110}
    • }
  •  Singh, R., Warmuth, M., Raj, B., Lamere, P., "Classification with Free Energy at Raised Temperatures", Eurospeech, September 2003.
    BibTeX TR2003-22 PDF
    • @inproceedings{Singh2003sep,
    • author = {Singh, R. and Warmuth, M. and Raj, B. and Lamere, P.},
    • title = {Classification with Free Energy at Raised Temperatures},
    • booktitle = {Eurospeech},
    • year = 2003,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2003-22}
    • }
  •  Lin, S., Vetro, A., Wang, Y., "Rate-Distortion Analysis of the Multiple Description Motion Compensation Video Coding Scheme", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003, vol. 3, pp. 401-404.
    BibTeX TR2003-27 PDF
    • @inproceedings{Lin2003apr,
    • author = {Lin, S. and Vetro, A. and Wang, Y.},
    • title = {Rate-Distortion Analysis of the Multiple Description Motion Compensation Video Coding Scheme},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 3,
    • pages = {401--404},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2003-27}
    • }
  •  Raj, B., Whittaker, E.W.D., "Lossless Compression of Language Model Structure and Word Identifiers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003, vol. 1, pp. 388-391.
    BibTeX IEEE Xplore
    • @inproceedings{Raj2003apr,
    • author = {Raj, B. and Whittaker, E.W.D.},
    • title = {Lossless Compression of Language Model Structure and Word Identifiers},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 1,
    • pages = {388--391},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1198799}
    • }
  •  Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Factorial HMMs", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003.
    BibTeX
    • @inproceedings{Reyes-Gomez2003apr,
    • author = {Reyes-Gomez, M.J. and Raj, B. and Ellis, D.P.W.},
    • title = {Multi-Channel Source Separation by Factorial HMMs},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • month = apr
    • }
  •  Singh, R., Raj, B., "Tracking Noise via Dynamical Systems with a Continuum of States", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003.
    BibTeX
    • @inproceedings{Singh2003apr,
    • author = {Singh, R. and Raj, B.},
    • title = {Tracking Noise via Dynamical Systems with a Continuum of States},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • month = apr
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Audio Events Detection Based Highlights Extraction from Baseball, Golf and Soccer Games in a Unified Framework", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003, vol. 5, pp. 632-635.
    BibTeX IEEE Xplore
    • @inproceedings{Xiong2003apr2,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
    • title = {Audio Events Detection Based Highlights Extraction from Baseball, Golf and Soccer Games in a Unified Framework},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 5,
    • pages = {632--635},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1200049}
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2003.1200048, April 2003, vol. 5, pp. 628-631.
    BibTeX IEEE Xplore
    • @inproceedings{Xiong2003apr1,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
    • title = {Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2003,
    • volume = 5,
    • pages = {628--631},
    • month = apr,
    • doi = {10.1109/ICASSP.2003.1200048},
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1200048}
    • }
  •  Seltzer, M.L., Raj, B., "Speech Recognizer Based Filter Optimization for Microphone Array Processing", IEEE Signal Processing Letters, Vol. 10, No. 3, pp. 69-71, March 2003.
    BibTeX IEEE Xplore
    • @article{Seltzer2003mar,
    • author = {Seltzer, M.L. and Raj, B.},
    • title = {Speech Recognizer Based Filter Optimization for Microphone Array Processing},
    • journal = {IEEE Signal Processing Letters},
    • year = 2003,
    • volume = 10,
    • number = 3,
    • pages = {69--71},
    • month = mar,
    • issn = {1070-9908},
    • url = {https://ieeexplore.ieee.org/document/1182087}
    • }
  •  Raj, B., Singh, R., "Classifier-Based Non-Linear Projection for Adaptive Endpointing of Continuous Speech", Computer Speech and Language, Vol. 17, No. 1, pp. 5-26, January 2003.
    BibTeX
    • @article{Raj2003jan,
    • author = {Raj, B. and Singh, R.},
    • title = {Classifier-Based Non-Linear Projection for Adaptive Endpointing of Continuous Speech},
    • journal = {Computer Speech and Language},
    • year = 2003,
    • volume = 17,
    • number = 1,
    • pages = {5--26},
    • month = jan
    • }
  •  Candace L. Sidner, "Building Spoken Language Collaborative Interface Agents", Tech. Rep. TR2002-38, Mitsubishi Electric Research Laboratories, Cambridge, MA, August 2002.
    BibTeX TR2002-38 PDF
    • @techreport{MERL_TR2002-38,
    • author = {Candace L. Sidner},
    • title = {Building Spoken Language Collaborative Interface Agents},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2002-38},
    • month = aug,
    • year = 2002,
    • url = {https://www.merl.com/publications/TR2002-38/}
    • }
  •  Singh, R., Raj, B., Stern, R.M., "Model Compensation and Matched Condition Methods for Robust Speech Recognition" in Noise Reduction in Speech Applications, Davis, G.M., Ed., Electrical Engineering & Applied Signal Processing Series, chapter 10, pp. 245-275, CRC Press, May 2002.
    BibTeX CRC Press
    • @incollection{Singh2002may2,
    • author = {Singh, R. and Raj, B. and Stern, R.M.},
    • title = {Model Compensation and Matched Condition Methods for Robust Speech Recognition},
    • booktitle = {Noise Reduction in Speech Applications},
    • year = 2002,
    • editor = {Davis, G.M.},
    • series = {Electrical Engineering \& Applied Signal Processing Series},
    • chapter = 10,
    • pages = {245--275},
    • month = may,
    • publisher = {CRC Press},
    • url = {https://www.crcpress.com/product/isbn/9780849309496}
    • }
  •  Singh, R., Stern, R.M., Raj, B., "Signal and Feature Compensation Methods for Robust Speech Recognition" in Noise Reduction in Speech Applications, Davis, G.M., Ed., Electrical Engineering & Applied Signal Processing Series, chapter 9, pp. 219-244, CRC Press, May 2002.
    BibTeX CRC Press
    • @incollection{Singh2002may1,
    • author = {Singh, R. and Stern, R.M. and Raj, B.},
    • title = {Signal and Feature Compensation Methods for Robust Speech Recognition},
    • booktitle = {Noise Reduction in Speech Applications},
    • year = 2002,
    • editor = {Davis, G.M.},
    • series = {Electrical Engineering \& Applied Signal Processing Series},
    • chapter = 9,
    • pages = {219--244},
    • month = may,
    • publisher = {CRC Press},
    • url = {https://www.crcpress.com/product/isbn/9780849309496}
    • }
  •  Seltzer, M., Raj, B., Stern, R., "Speech Recognizer Based Microphone Array Processing for Robust Hands-Free Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2002, vol. 1, pp. 897-900.
    BibTeX IEEE Xplore
    • @inproceedings{Seltzer2002may,
    • author = {Seltzer, M. and Raj, B. and Stern, R.},
    • title = {Speech Recognizer Based Microphone Array Processing for Robust Hands-Free Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2002,
    • volume = 1,
    • pages = {897--900},
    • month = may,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1005885}
    • }
  •  Vetro, A., Wang, Y., Sun, H., "A Probabilistic Approach for Rate-Distortion Modeling of Multi-scale Binary Shape", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2002, vol. 4, pp. 3353-3356.
    BibTeX IEEE Xplore
    • @inproceedings{Vetro2002may1,
    • author = {Vetro, A. and Wang, Y. and Sun, H.},
    • title = {A Probabilistic Approach for Rate-Distortion Modeling of Multi-scale Binary Shape},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2002,
    • volume = 4,
    • pages = {3353--3356},
    • month = may,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1004630}
    • }
  •  Xie, L., Chang, S.-F., Divakaran, A., Sun, H., "Structure Analysis of Soccer Video with Hidden Markov Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2002, vol. 4, pp. 4096-4099.
    BibTeX IEEE Xplore
    • @inproceedings{Xie2002may,
    • author = {Xie, L. and Chang, S.-F. and Divakaran, A. and Sun, H.},
    • title = {Structure Analysis of Soccer Video with Hidden Markov Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2002,
    • volume = 4,
    • pages = {4096--4099},
    • month = may,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/1004819}
    • }
  •  Michael Seltzer, "Calibration of Microphone Arrays for Improved Speech Recognition", Tech. Rep. TR2001-43, Mitsubishi Electric Research Laboratories, Cambridge, MA, December 2001.
    BibTeX TR2001-43 PDF
    • @techreport{MERL_TR2001-43,
    • author = {Michael Seltzer},
    • title = {Calibration of Microphone Arrays for Improved Speech Recognition},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2001-43},
    • month = dec,
    • year = 2001,
    • url = {https://www.merl.com/publications/TR2001-43/}
    • }
  •  Raj, B., Migdal, J., Singh, R., "Distributed Speech Recognition with Codec Parameters", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2001, pp. 127-130.
    BibTeX TR2001-45 PDF
    • @inproceedings{Raj2001dec,
    • author = {Raj, B. and Migdal, J. and Singh, R.},
    • title = {Distributed Speech Recognition with Codec Parameters},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2001,
    • pages = {127--130},
    • month = dec,
    • url = {https://www.merl.com/publications/TR2001-45}
    • }
  •  Raj, B., Seltzer, M., Stern, R., "Robust Speech Recognition: The Case for Restoring Missing Features", Workshop for Consistent and Reliable Acoustic Cues (CRAC), September 2001.
    BibTeX TR2001-40 PDF
    • @inproceedings{Raj2001sep,
    • author = {Raj, B. and Seltzer, M. and Stern, R.},
    • title = {Robust Speech Recognition: The Case for Restoring Missing Features},
    • booktitle = {Workshop for Consistent and Reliable Acoustic Cues (CRAC)},
    • year = 2001,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2001-40}
    • }