- Guinness, J., Raj, B., Schmidt-Nielsen, B., Turicchia, L., Sarpeshkar, R., "A Companding Front End for Noise-Robust Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 1, pp. 249-252.
BibTeX TR2005-023 PDF- @inproceedings{Guinness2005mar,
- author = {Guinness, J. and Raj, B. and Schmidt-Nielsen, B. and Turicchia, L. and Sarpeshkar, R.},
- title = {A Companding Front End for Noise-Robust Automatic Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2005,
- volume = 1,
- pages = {249--252},
- month = mar,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2005-023}
- }
- Radhakrishnan, R., Divakaran, A., "Systematic Acquisition of Audio Classes for Elevator Surveillance", SPIE Conference on Image and Video Communications and Processing, March 2005, vol. 5685, pp. 64-71.
BibTeX TR2005-076 PDF- @inproceedings{Radhakrishnan2005mar,
- author = {Radhakrishnan, R. and Divakaran, A.},
- title = {Systematic Acquisition of Audio Classes for Elevator Surveillance},
- booktitle = {SPIE Conference on Image and Video Communications and Processing},
- year = 2005,
- volume = 5685,
- pages = {64--71},
- month = mar,
- url = {https://www.merl.com/publications/TR2005-076}
- }
- Radhakrishnan, R., Divakaran, A., Xiong, Z., "A Time Series Clustering based Framework for Multimedia Mining and Summarization", ACM SIGMM International Workshop on Multimedia Information Retrieval (MIR), October 2004, pp. 157-164.
BibTeX TR2004-046 PDF- @inproceedings{Radhakrishnan2004oct,
- author = {Radhakrishnan, R. and Divakaran, A. and Xiong, Z.},
- title = {A Time Series Clustering based Framework for Multimedia Mining and Summarization},
- booktitle = {ACM SIGMM International Workshop on Multimedia Information Retrieval (MIR)},
- year = 2004,
- pages = {157--164},
- month = oct,
- isbn = {1-58113-940-3},
- url = {https://www.merl.com/publications/TR2004-046}
- }
- Wolf, P., Woelfel, J., van Gemert, J., Raj, B., Wong, D., "SpokenQuery: An Alternate Approach to Choosing Items with Speech", International Conference on Spoken Language Processing (ICSLP), October 2004.
BibTeX TR2004-121 PDF- @inproceedings{Wolf2004oct,
- author = {Wolf, P. and Woelfel, J. and {van Gemert}, J. and Raj, B. and Wong, D.},
- title = {SpokenQuery: An Alternate Approach to Choosing Items with Speech},
- booktitle = {International Conference on Spoken Language Processing (ICSLP)},
- year = 2004,
- month = oct,
- url = {https://www.merl.com/publications/TR2004-121}
- }
- Smaragdis, P., "Discovering Auditory Objects Through Non-Negativity Constraints", Statistical and Perceptual Audio Processing (SAPA), October 2004.
BibTeX TR2004-094 PDF- @inproceedings{Smaragdis2004oct,
- author = {Smaragdis, P.},
- title = {Discovering Auditory Objects Through Non-Negativity Constraints},
- booktitle = {Statistical and Perceptual Audio Processing (SAPA)},
- year = 2004,
- month = oct,
- url = {https://www.merl.com/publications/TR2004-094}
- }
- Seltzer, M.L., Raj, B., Stern, R.M., "Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition", IEEE Transactions on Speech and Audio Processing, Vol. 12, No. 5, pp. 489-498, September 2004.
BibTeX TR2004-088 PDF- @article{Seltzer2004sep1,
- author = {Seltzer, M.L. and Raj, B. and Stern, R.M.},
- title = {Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition},
- journal = {IEEE Transactions on Speech and Audio Processing},
- year = 2004,
- volume = 12,
- number = 5,
- pages = {489--498},
- month = sep,
- note = {Awarded Best Young Author, March 2007},
- issn = {1063-6676},
- url = {https://www.merl.com/publications/TR2004-088}
- }
- Smaragdis, P., "Non-negative Matrix Factor Deconvolution; Extraction of Multiple Sound Sources from Monophonic Inputs", International Congress on Independent Component Analysis and Blind Signal Separation, September 2004, vol. 3195, pp. 494-499.
BibTeX TR2004-104 PDF- @inproceedings{Smaragdis2004sep,
- author = {Smaragdis, P.},
- title = {Non-negative Matrix Factor Deconvolution; Extraction of Multiple Sound Sources from Monophonic Inputs},
- booktitle = {International Congress on Independent Component Analysis and Blind Signal Separation},
- year = 2004,
- volume = 3195,
- pages = {494--499},
- month = sep,
- isbn = {3-540-23056-4},
- url = {https://www.merl.com/publications/TR2004-104}
- }
- Seltzer, M.L., Raj, B., Stern, R.M., "A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 379-393, September 2004.
BibTeX TR2004-086 PDF- @article{Seltzer2004sep2,
- author = {Seltzer, M.L. and Raj, B. and Stern, R.M.},
- title = {A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition},
- journal = {Speech Communication},
- year = 2004,
- volume = 43,
- number = 4,
- pages = {379--393},
- month = sep,
- url = {https://www.merl.com/publications/TR2004-086}
- }
- Raj, B., Seltzer, M.L., Stern, R.M., "Reconstruction of Missing Features for Robust Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 275-296, September 2004.
BibTeX TR2004-087 PDF- @article{Raj2004sep,
- author = {Raj, B. and Seltzer, M.L. and Stern, R.M.},
- title = {Reconstruction of Missing Features for Robust Speech Recognition},
- journal = {Speech Communication},
- year = 2004,
- volume = 43,
- number = 4,
- pages = {275--296},
- month = sep,
- url = {https://www.merl.com/publications/TR2004-087}
- }
- Singh, R., Raj, B., "Classification in Likelihood Spaces", Technometrics, Vol. 46, No. 3, pp. 318-329, August 2004.
BibTeX TR2004-089 PDF- @article{Singh2004aug,
- author = {Singh, R. and Raj, B.},
- title = {Classification in Likelihood Spaces},
- journal = {Technometrics},
- year = 2004,
- volume = 46,
- number = 3,
- pages = {318--329},
- month = aug,
- issn = {0040-1706},
- url = {https://www.merl.com/publications/TR2004-089}
- }
- Smaragdis, P., "Exploiting Redundancy to Construct Listening Systems", Perspectives on Speech Separation, July 2004.
BibTeX SpringerLink- @inproceedings{Smaragdis2004jul,
- author = {Smaragdis, P.},
- title = {Exploiting Redundancy to Construct Listening Systems},
- booktitle = {Perspectives on Speech Separation},
- year = 2004,
- month = jul,
- url = {https://link.springer.com/chapter/10.1007/0-387-22794-6_7}
- }
- Radhakrishnan, R., Xiong, Z., Divakaran, A., Memon, N., "Time Series Analysis and Segmentation Using Eigenvectors for Mining Semantic Audio Label Sequences", IEEE International Conference on Multimedia and Expo (ICME), June 2004.
BibTeX TR2004-063 PDF- @inproceedings{Radhakrishnan2004jun,
- author = {Radhakrishnan, R. and Xiong, Z. and Divakaran, A. and Memon, N.},
- title = {Time Series Analysis and Segmentation Using Eigenvectors for Mining Semantic Audio Label Sequences},
- booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
- year = 2004,
- month = jun,
- url = {https://www.merl.com/publications/TR2004-063}
- }
- Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Effective and Efficient Sports Highlights Extraction Using the Minimum Description Length Criterion in Selecting GMM Structures", IEEE International Conference on Multimedia and Expo (ICME), June 2004.
BibTeX TR2004-061 PDF- @inproceedings{Xiong2004jun,
- author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
- title = {Effective and Efficient Sports Highlights Extraction Using the Minimum Description Length Criterion in Selecting GMM Structures},
- booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
- year = 2004,
- month = jun,
- url = {https://www.merl.com/publications/TR2004-061}
- }
- Brown, J.C., Smaragdis, P., "Independent Component Analysis for Automatic Note Extraction from Musical Trills", Journal of the Acoustical Society of America, Vol. 115, No. 5, pp. 2295-2306, May 2004.
BibTeX TR2004-078 PDF- @article{Brown2004may,
- author = {Brown, J.C. and Smaragdis, P.},
- title = {Independent Component Analysis for Automatic Note Extraction from Musical Trills},
- journal = {Journal of the Acoustical Society of America},
- year = 2004,
- volume = 115,
- number = 5,
- pages = {2295--2306},
- month = may,
- url = {https://www.merl.com/publications/TR2004-078}
- }
- Raj, B., Singh, R., Stern, R.M., "On Tracking Noise with Linear Dynamical System Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2004, vol. 1, pp. 965-968.
BibTeX TR2004-042 PDF- @inproceedings{Raj2004may,
- author = {Raj, B. and Singh, R. and Stern, R.M.},
- title = {On Tracking Noise with Linear Dynamical System Models},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2004,
- volume = 1,
- pages = {965--968},
- month = may,
- issn = {1520-6149},
- url = {https://www.merl.com/publications/TR2004-042}
- }
- DeVault, D., Rich, C., Sidner, C.L., "Natural Language Generation and Discourse Context: Computing Distractor Sets from the Focus Stack", International Florida Artificial Intelligence Research Symposium (FLAIRS), May 2004.
BibTeX TR2004-004 PDF- @inproceedings{DeVault2004may,
- author = {DeVault, D. and Rich, C. and Sidner, C.L.},
- title = {Natural Language Generation and Discourse Context: Computing Distractor Sets from the Focus Stack},
- booktitle = {International Florida Artificial Intelligence Research Symposium (FLAIRS)},
- year = 2004,
- month = may,
- url = {https://www.merl.com/publications/TR2004-004}
- }
- Divi, V., Forlines, C., van Gemert, J.V., Raj, B., Schmidt-Nielsen, B., Wittenburg, K., Woelfel, J., Wolf, P., Zhang, F., "A Speech-In List-Out Approach to Spoken User Interfaces", Human Language Technology Conference (HLT), May 2004.
BibTeX TR2004-023 PDF- @inproceedings{Divi2004may,
- author = {Divi, V. and Forlines, C. and {van Gemert}, J.V. and Raj, B. and Schmidt-Nielsen, B. and Wittenburg, K. and Woelfel, J. and Wolf, P. and Zhang, F.},
- title = {A Speech-In List-Out Approach to Spoken User Interfaces},
- booktitle = {Human Language Technology Conference (HLT)},
- year = 2004,
- month = may,
- url = {https://www.merl.com/publications/TR2004-023}
- }
- Radhakrishnan, R., Xiong, Z., Divakaran, A., Ishikawa, Y., "Generation of Sports Highlights Using a Combination of Supervised & Unsupervised Learning in Audio Domain", IEEE Pacific-Rim Conference on Multimedia (PCM), December 2003, vol. 2, pp. 935-939.
BibTeX TR2003-144 PDF- @inproceedings{Radhakrishan2003dec,
- author = {Radhakrishnan, R. and Xiong, Z. and Divakaran, A. and Ishikawa, Y.},
- title = {Generation of Sports Highlights Using a Combination of Supervised \& Unsupervised Learning in Audio Domain},
- booktitle = {IEEE Pacific-Rim Conference on Multimedia (PCM)},
- year = 2003,
- volume = 2,
- pages = {935--939},
- month = dec,
- url = {https://www.merl.com/publications/TR2003-144}
- }
- Raj, B., Seltzer, M.L., Reyes-Gomez, M.J., "Speech Recognizer Based Maximum Likelihood Beamforming", NSF Workshop on Perspectives on Speech Separation, October 2003.
BibTeX TR2003-87 PDF- @inproceedings{Raj2003oct,
- author = {Raj, B. and Seltzer, M.L. and Reyes-Gomez, M.J.},
- title = {Speech Recognizer Based Maximum Likelihood Beamforming},
- booktitle = {NSF Workshop on Perspectives on Speech Separation},
- year = 2003,
- month = oct,
- url = {https://www.merl.com/publications/TR2003-87}
- }
- Reyes-Gomez, M.J., Raj, B., Ellis, D.P.W., "Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 13-16.
BibTeX TR2003-88 PDF- @inproceedings{Reyes-Gomez2003oct,
- author = {Reyes-Gomez, M.J. and Raj, B. and Ellis, D.P.W.},
- title = {Multi-Channel Source Separation by Beamforming Trained with Factorial HMMs},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2003,
- pages = {13--16},
- month = oct,
- url = {https://www.merl.com/publications/TR2003-88}
- }
- Smaragdis, P., Brown, J.C., "Non-negative Matrix Factorization for Polyphonic Music Transcription", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2003, pp. 177-180.
BibTeX TR2003-139 PDF- @inproceedings{Smaragdis2003oct,
- author = {Smaragdis, P. and Brown, J.C.},
- title = {Non-negative Matrix Factorization for Polyphonic Music Transcription},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2003,
- pages = {177--180},
- month = oct,
- url = {https://www.merl.com/publications/TR2003-139}
- }
- Lamere, P., Kwok, P., Walker, W., Gouvea, E., Singh, R., Raj, B., Wolf, P.P., "Design of the CMU Sphinx-4 Decoder", Eurospeech, September 2003.
BibTeX TR2003-110 PDF- @inproceedings{Lamere2003sep,
- author = {Lamere, P. and Kwok, P. and Walker, W. and Gouvea, E. and Singh, R. and Raj, B. and Wolf, P.P.},
- title = {Design of the CMU Sphinx-4 Decoder},
- booktitle = {Eurospeech},
- year = 2003,
- month = sep,
- url = {https://www.merl.com/publications/TR2003-110}
- }
- Singh, R., Warmuth, M., Raj, B., Lamere, P., "Classification with Free Energy at Raised Temperatures", Eurospeech, September 2003.
BibTeX TR2003-22 PDF- @inproceedings{Singh2003sep,
- author = {Singh, R. and Warmuth, M. and Raj, B. and Lamere, P.},
- title = {Classification with Free Energy at Raised Temperatures},
- booktitle = {Eurospeech},
- year = 2003,
- month = sep,
- url = {https://www.merl.com/publications/TR2003-22}
- }
- Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification", IEEE International Conference on Multimedia and Expo (ICME), DOI: 10.1109/ICME.2003.1221332, July 2003, vol. 3, pp. 397-400.
BibTeX TR2004-082 PDF- @inproceedings{Xiong2003jul2,
- author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T.S.},
- title = {Comparing MFCC and MPEG-7 Audio Features for Feature Extraction, Maximum Likelihood HMM and Entropic Prior HMM for Sports Audio Classification},
- booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
- year = 2003,
- volume = 3,
- pages = {397--400},
- month = jul,
- doi = {10.1109/ICME.2003.1221332},
- url = {https://www.merl.com/publications/TR2004-082}
- }
- Raj, B., Whittaker, E.W.D., "Lossless Compression of Language Model Structure and Word Identifiers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2003, vol. 1, pp. 388-391.
BibTeX IEEE Xplore- @inproceedings{Raj2003apr,
- author = {Raj, B. and Whittaker, E.W.D.},
- title = {Lossless Compression of Language Model Structure and Word Identifiers},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2003,
- volume = 1,
- pages = {388--391},
- month = apr,
- issn = {1520-6149},
- url = {https://ieeexplore.ieee.org/document/1198799}
- }