Publications

359 / 3,666 publications found.


  •  Pan, P., Porikli, F., Schonfeld, D., "A New Method for Tracking Performance Evaluation Based on a Reflective Model and Perturbation Analysis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2009.
    BibTeX TR2009-019 PDF
    • @inproceedings{Pan2009apr,
    • author = {Pan, P. and Porikli, F. and Schonfeld, D.},
    • title = {A New Method for Tracking Performance Evaluation Based on a Reflective Model and Perturbation Analysis},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2009,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2009-019}
    • }
  •  Wilson, K.W., Raj, B., Smaragdis, P., "Regularized Non-negative Matrix Factorization with Temporal Dependencies for Speech Denoising", Interspeech, September 2008.
    BibTeX TR2008-075 PDF
    • @inproceedings{Wilson2008sep,
    • author = {Wilson, K.W. and Raj, B. and Smaragdis, P.},
    • title = {Regularized Non-negative Matrix Factorization with Temporal Dependencies for Speech Denoising},
    • booktitle = {Interspeech},
    • year = 2008,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2008-075}
    • }
  •  Weinberg, G., Kondili, D., "Display Style Considerations for In-Car Multimodal Music Search", IADIS International Conference Interfaces and Human Computer Interaction (IHCI), July 2008.
    BibTeX TR2008-038 PDF
    • @inproceedings{Weinberg2008jul,
    • author = {Weinberg, G. and Kondili, D.},
    • title = {Display Style Considerations for In-Car Multimodal Music Search},
    • booktitle = {IADIS International Conference Interfaces and Human Computer Interaction (IHCI)},
    • year = 2008,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2008-038}
    • }
  •  Mei, X., Porikli, F., "Joint Tracking and Video Registration by Factorial Hidden Markov Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2008, pp. 973-976.
    BibTeX TR2008-010 PDF
    • @inproceedings{Mei2008mar,
    • author = {Mei, X. and Porikli, F.},
    • title = {Joint Tracking and Video Registration by Factorial Hidden Markov Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2008,
    • pages = {973--976},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2008-010}
    • }
  •  Kalgaonkar, K., Raj, B., "Ultrasonic Doppler Sensor for Speaker Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2008, pp. 4865-4868.
    BibTeX TR2008-014 PDF
    • @inproceedings{Kalgaonkar2008mar,
    • author = {Kalgaonkar, K. and Raj, B.},
    • title = {Ultrasonic Doppler Sensor for Speaker Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2008,
    • pages = {4865--4868},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2008-014}
    • }
  •  Wilson, K.W., Raj, B., Smaragdis, P., Divakaran, A., "Speech Denoising Using Nonnegative Matrix Factorization with Priors", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2008, pp. 4029-4032.
    BibTeX TR2008-012 PDF
    • @inproceedings{Wilson2008mar,
    • author = {Wilson, K.W. and Raj, B. and Smaragdis, P. and Divakaran, A.},
    • title = {Speech Denoising Using Nonnegative Matrix Factorization with Priors},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2008,
    • pages = {4029--4032},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2008-012}
    • }
  •  Smaragdis, P., Raj, B., Shashanka, M., "Sparse and Shift-Invariant Feature Extraction from Non-Negative Data", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2008, pp. 2069-2072.
    BibTeX TR2008-013 PDF
    • @inproceedings{Smaragdis2008mar,
    • author = {Smaragdis, P. and Raj, B. and Shashanka, M.},
    • title = {Sparse and Shift-Invariant Feature Extraction from Non-Negative Data},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2008,
    • pages = {2069--2072},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2008-013}
    • }
  •  Schmidt-Nielsen, B., Harsham, B., Raj, B., Forlines, C., "Speech-Based UI Design for the Automobile" in Handbook of Research on User Interface Design and Evaluation for Mobile Technology, Lumsden, J., Ed., vol. 1, chapter 15, pp. 237-252, Information Science Reference, February 2008.
    BibTeX TR2008-006 PDF
    • @incollection{Schmidt-Nielsen2008feb,
    • author = {Schmidt-Nielsen, B. and Harsham, B. and Raj, B. and Forlines, C.},
    • title = {Speech-Based UI Design for the Automobile},
    • booktitle = {Handbook of Research on User Interface Design and Evaluation for Mobile Technology},
    • year = 2008,
    • editor = {Lumsden, J.},
    • volume = 1,
    • chapter = 15,
    • pages = {237--252},
    • month = feb,
    • publisher = {Information Science Reference},
    • isbn = {978-1-59904-871-0},
    • url = {https://www.merl.com/publications/TR2008-006}
    • }
  •  Kalgaonkar, K., Hu, R., Raj, B., "Ultrasonic Doppler Sensor for Voice Activity Detection", IEEE Signal Processing Letters, Vol. 14, No. 10, pp. 754-757, October 2007.
    BibTeX TR2007-106 PDF
    • @article{Kalgaonkar2007oct,
    • author = {Kalgaonkar, K. and Hu, R. and Raj, B.},
    • title = {Ultrasonic Doppler Sensor for Voice Activity Detection},
    • journal = {IEEE Signal Processing Letters},
    • year = 2007,
    • volume = 14,
    • number = 10,
    • pages = {754--757},
    • month = oct,
    • issn = {1558-2361},
    • url = {https://www.merl.com/publications/TR2007-106}
    • }
  •  Reddy, A.M., Raj, B., "Soft Mask Methods for Single-Channel Speaker Separation", IEEE Transactions on Audio, Speech and Language Processing, Vol. 15, No. 6, pp. 1766-1776, August 2007.
    BibTeX IEEE Xplore
    • @article{Reddy2007aug,
    • author = {Reddy, A.M. and Raj, B.},
    • title = {Soft Mask Methods for Single-Channel Speaker Separation},
    • journal = {IEEE Transactions on Audio, Speech and Language Processing},
    • year = 2007,
    • volume = 15,
    • number = 6,
    • pages = {1766--1776},
    • month = aug,
    • issn = {1558-7916},
    • url = {https://ieeexplore.ieee.org/document/4276763}
    • }
  •  Smaragdis, P., Shashanka, M., "A Framework for Secure Speech Recognition", IEEE Transactions on Audio, Speech and Language Processing, DOI: 10.1109/TASL.2007.894526, Vol. 15, No. 4, pp. 1404-1413, May 2007.
    BibTeX TR2007-057 PDF
    • @article{Smaragdis2007may,
    • author = {Smaragdis, P. and Shashanka, M.},
    • title = {A Framework for Secure Speech Recognition},
    • journal = {IEEE Transactions on Audio, Speech and Language Processing},
    • year = 2007,
    • volume = 15,
    • number = 4,
    • pages = {1404--1413},
    • month = may,
    • doi = {10.1109/TASL.2007.894526},
    • issn = {1558-7916},
    • url = {https://www.merl.com/publications/TR2007-057}
    • }
  •  Tse, E., Shen, C., Greenberg, S., Forlines, C., "How Pairs Interact Over a Multimodal Digital Table", Conference on Human Factors in Computing Systems (SIGCHI), April 2007, pp. 215-218.
    BibTeX TR2007-055 PDF
    • @inproceedings{Tse2007apr,
    • author = {Tse, E. and Shen, C. and Greenberg, S. and Forlines, C.},
    • title = {How Pairs Interact Over a Multimodal Digital Table},
    • booktitle = {Conference on Human Factors in Computing Systems (SIGCHI)},
    • year = 2007,
    • pages = {215--218},
    • month = apr,
    • isbn = {978-1-59593-593-9},
    • url = {https://www.merl.com/publications/TR2007-055}
    • }
  •  Draper, S.C., Khisti, A., Martinian, E., Vetro, A., Yedidia, J.S., "Using Distributed Source Coding to Secure Fingerprint Biometrics", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 2, pp. 129-132.
    BibTeX TR2007-005 PDF
    • @inproceedings{Draper2007apr,
    • author = {Draper, S.C. and Khisti, A. and Martinian, E. and Vetro, A. and Yedidia, J.S.},
    • title = {Using Distributed Source Coding to Secure Fingerprint Biometrics},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2007,
    • volume = 2,
    • pages = {129--132},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2007-005}
    • }
  •  Raj, B., Singh, R., Shashanka, M., Smaragdis, P., "Bandwidth Expansion with a Polya Urn Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 4, pp. IV597-IV600.
    BibTeX TR2007-058 PDF
    • @inproceedings{Raj2007apr,
    • author = {Raj, B. and Singh, R. and Shashanka, M. and Smaragdis, P.},
    • title = {Bandwidth Expansion with a Polya Urn Model},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2007,
    • volume = 4,
    • pages = {IV597--IV600},
    • month = apr,
    • url = {https://www.merl.com/publications/TR2007-058}
    • }
  •  Shashanka, M.V.S., Raj, B., Smaragdis, P., "Sparse Overcomplete Decomposition for Single Channel Speaker Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 2, pp. 641-644.
    BibTeX TR2007-031 PDF
    • @inproceedings{Shashanka2007apr,
    • author = {Shashanka, M.V.S. and Raj, B. and Smaragdis, P.},
    • title = {Sparse Overcomplete Decomposition for Single Channel Speaker Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2007,
    • volume = 2,
    • pages = {641--644},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2007-031}
    • }
  •  Smaragdis, P., Shashanka, M., "A Framework for Secure Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2007, vol. 4, pp. 969-972.
    BibTeX IEEE Xplore
    • @inproceedings{Smaragdis2007apr,
    • author = {Smaragdis, P. and Shashanka, M.},
    • title = {A Framework for Secure Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2007,
    • volume = 4,
    • pages = {969--972},
    • month = apr,
    • issn = {1520-6149},
    • url = {https://ieeexplore.ieee.org/document/4218264}
    • }
  •  Smaragdis, P., "Convolutive Speech Bases and their Application to Supervised Speech Separation", IEEE Transactions on Audio, Speech and Language Processing, Vol. 15, No. 1, pp. 1-12, January 2007.
    BibTeX TR2007-002 PDF
    • @article{Smaragdis2007jan2,
    • author = {Smaragdis, P.},
    • title = {Convolutive Speech Bases and their Application to Supervised Speech Separation},
    • journal = {IEEE Transactions on Audio, Speech and Language Processing},
    • year = 2007,
    • volume = 15,
    • number = 1,
    • pages = {1--12},
    • month = jan,
    • issn = {1558-7916},
    • url = {https://www.merl.com/publications/TR2007-002}
    • }
  •  Smaragdis, P., Boufounos, P., "Position and Trajectory Learning for Microphone Arrays", IEEE Transactions on Audio, Speech and Language Processing, Vol. 15, No. 1, pp. 358-368, January 2007.
    BibTeX TR2007-001 PDF
    • @article{Smaragdis2007jan1,
    • author = {Smaragdis, P. and Boufounos, P.},
    • title = {Position and Trajectory Learning for Microphone Arrays},
    • journal = {IEEE Transactions on Audio, Speech and Language Processing},
    • year = 2007,
    • volume = 15,
    • number = 1,
    • pages = {358--368},
    • month = jan,
    • issn = {1558-7916},
    • url = {https://www.merl.com/publications/TR2007-001}
    • }
  •  Tse, E., Greenberg, S., Shen, C., "GSI Demo: Multiuser Gesture/Speech Interaction over Digital Tables by Wrapping Single User Applications", International Conference on Multimodal Interfaces (ICMI), November 2006, pp. 76-83.
    BibTeX TR2006-085 PDF
    • @inproceedings{Tse2006nov,
    • author = {Tse, E. and Greenberg, S. and Shen, C.},
    • title = {GSI Demo: Multiuser Gesture/Speech Interaction over Digital Tables by Wrapping Single User Applications},
    • booktitle = {International Conference on Multimodal Interfaces (ICMI)},
    • year = 2006,
    • pages = {76--83},
    • month = nov,
    • isbn = {1-59593-541-X},
    • url = {https://www.merl.com/publications/TR2006-085}
    • }
  •  Weinberg, G., Raj, B., Kalgaonkar, K., "Two New Techniques for Natural Spoken User Interfaces", ACM Symposium on User Interface Software and Technology (UIST), October 2006.
    BibTeX TR2006-098 PDF
    • @inproceedings{Weinberg2006oct,
    • author = {Weinberg, G. and Raj, B. and Kalgaonkar, K.},
    • title = {Two New Techniques for Natural Spoken User Interfaces},
    • booktitle = {ACM Symposium on User Interface Software and Technology (UIST)},
    • year = 2006,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2006-098}
    • }
  •  Wittenburg, K., Lanning, T., Schwenke, D., Shubin, H., Vetro, A., "The Prospects for Unrestricted Speech Input for TV Content Search", International Working Conference on Advanced Visual Interfaces (AVI), May 2006.
    BibTeX TR2006-045 PDF
    • @inproceedings{Wittenburg2006may,
    • author = {Wittenburg, K. and Lanning, T. and Schwenke, D. and Shubin, H. and Vetro, A.},
    • title = {The Prospects for Unrestricted Speech Input for TV Content Search},
    • booktitle = {International Working Conference on Advanced Visual Interfaces (AVI)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-045}
    • }
  •  Tse, E., Shen, C., Greenberg, S., Forlines, C., "Enabling Interaction with Single User Applications through Speech and Gestures on a Multi-User Tabletop", International Working Conference on Advanced Visual Interfaces (AVI), May 2006.
    BibTeX TR2005-130 PDF
    • @inproceedings{Tse2006may1,
    • author = {Tse, E. and Shen, C. and Greenberg, S. and Forlines, C.},
    • title = {Enabling Interaction with Single User Applications through Speech and Gestures on a Multi-User Tabletop},
    • booktitle = {International Working Conference on Advanced Visual Interfaces (AVI)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2005-130}
    • }
  •  Radhakrishnan, R., Divakaran, A., "Generative Process Tracking for Audio Analysis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006, vol. 5, pp. V.
    BibTeX TR2006-053 PDF
    • @inproceedings{Radhakrishnan2006may,
    • author = {Radhakrishnan, R. and Divakaran, A.},
    • title = {Generative Process Tracking for Audio Analysis},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2006,
    • volume = 5,
    • pages = {V},
    • month = may,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2006-053}
    • }
  •  Raj, B., Shashanka, M.V.S., Smaragdis, P., "Latent Dirichlet Decomposition for Single Channel Speaker Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006.
    BibTeX TR2006-064 PDF
    • @inproceedings{Raj2006may,
    • author = {Raj, B. and Shashanka, M.V.S. and Smaragdis, P.},
    • title = {Latent Dirichlet Decomposition for Single Channel Speaker Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-064}
    • }
  •  Shashanka, M.V.S., Smaragdis, P., "Secure Sound Classification: Gaussian Mixture Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006.
    BibTeX TR2006-065 PDF
    • @inproceedings{Shashanka2006may,
    • author = {Shashanka, M.V.S. and Smaragdis, P.},
    • title = {Secure Sound Classification: Gaussian Mixture Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-065}
    • }