Publications

327 / 3,734 publications found.


  •  Hu, R., Raj, B., "A Robust Voice Activity Detector Using an Acoustic Doppler Radar", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), November 2005, pp. 171-176.
    BibTeX TR2005-159 PDF
    • @inproceedings{Hu2005nov,
    • author = {Hu, R. and Raj, B.},
    • title = {A Robust Voice Activity Detector Using an Acoustic {Doppler} Radar},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2005,
    • pages = {171--176},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2005-159}
    • }
  •  Radhakrishnan, R., Divakaran, A., Smaragdis, P., "Audio Analysis for Surveillance Applications", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2005, pp. 158-161.
    BibTeX TR2005-139 PDF
    • @inproceedings{Radhakrishnan2005oct,
    • author = {Radhakrishnan, R. and Divakaran, A. and Smaragdis, P.},
    • title = {Audio Analysis for Surveillance Applications},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2005,
    • pages = {158--161},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2005-139}
    • }
  •  Raj, B., Smaragdis, P., "Latent Variable Decomposition of Spectrograms for Single Channel Speaker Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2005, pp. 17-20.
    BibTeX TR2005-137 PDF
    • @inproceedings{Raj2005oct,
    • author = {Raj, B. and Smaragdis, P.},
    • title = {Latent Variable Decomposition of Spectrograms for Single Channel Speaker Separation},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2005,
    • pages = {17--20},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2005-137}
    • }
  •  Smaragdis, P., Boufounos, P., "Learning Source Trajectories Using Wrapped-Phase Hidden Markov Models", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2005, pp. 114-117.
    BibTeX TR2005-138 PDF
    • @inproceedings{Smaragdis2005oct,
    • author = {Smaragdis, P. and Boufounos, P.},
    • title = {Learning Source Trajectories Using Wrapped-Phase Hidden {Markov} Models},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2005,
    • pages = {114--117},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2005-138}
    • }
  •  Forlines, C., Schmidt-Nielsen, B., Raj, B., Wittenburg, K., Wolf, P., "A Comparison between Spoken Queries and Menu-based Interfaces for In-Car Digital Music Selection", IFIP TC13 International Conference on Human-Computer Interaction (INTERACT), September 2005.
    BibTeX TR2005-020 PDF
    • @inproceedings{Forlines2005sep1,
    • author = {Forlines, C. and Schmidt-Nielsen, B. and Raj, B. and Wittenburg, K. and Wolf, P.},
    • title = {A Comparison between Spoken Queries and Menu-based Interfaces for In-Car Digital Music Selection},
    • booktitle = {IFIP TC13 International Conference on Human-Computer Interaction (INTERACT)},
    • year = 2005,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2005-020}
    • }
  •  Bansal, D., Raj, B., Smaragdis, P., "Bandwidth Expansion of Narrowband Speech Using non-Negative Matrix Factorization", Eurospeech, September 2005.
    BibTeX TR2005-135 PDF
    • @inproceedings{Bansal2005sep,
    • author = {Bansal, D. and Raj, B. and Smaragdis, P.},
    • title = {Bandwidth Expansion of Narrowband Speech Using non-Negative Matrix Factorization},
    • booktitle = {Eurospeech},
    • year = 2005,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2005-135}
    • }
  •  Raj, B., Singh, R., Smaragdis, P., "Recognizing Speech from Simultaneous Speakers", Eurospeech, September 2005.
    BibTeX TR2005-136 PDF
    • @inproceedings{Raj2005sep,
    • author = {Raj, B. and Singh, R. and Smaragdis, P.},
    • title = {Recognizing Speech from Simultaneous Speakers},
    • booktitle = {Eurospeech},
    • year = 2005,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2005-136}
    • }
  •  Smaragdis, P., "From Learning Music to Learning to Separate", Forum Acusticum, August 2005.
    BibTeX TR2005-134 PDF
    • @inproceedings{Smaragdis2005aug,
    • author = {Smaragdis, P.},
    • title = {From Learning Music to Learning to Separate},
    • booktitle = {Forum Acusticum},
    • year = 2005,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2005-134}
    • }
  •  Guinness, J., Raj, B., Schmidt-Nielsen, B., Turicchia, L., Sarpeshkar, R., "A Companding Front End for Noise-Robust Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 1, pp. 249-252.
    BibTeX TR2005-023 PDF
    • @inproceedings{Guinness2005mar,
    • author = {Guinness, J. and Raj, B. and Schmidt-Nielsen, B. and Turicchia, L. and Sarpeshkar, R.},
    • title = {A Companding Front End for Noise-Robust Automatic Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2005,
    • volume = 1,
    • pages = {249--252},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2005-023}
    • }
  •  Radhakrishnan, R., Divakaran, A., "Systematic Acquisition of Audio Classes for Elevator Surveillance", SPIE Conference on Image and Video Communications and Processing, March 2005, vol. 5685, pp. 64-71.
    BibTeX TR2005-076 PDF
    • @inproceedings{Radhakrishnan2005mar,
    • author = {Radhakrishnan, R. and Divakaran, A.},
    • title = {Systematic Acquisition of Audio Classes for Elevator Surveillance},
    • booktitle = {SPIE Conference on Image and Video Communications and Processing},
    • year = 2005,
    • volume = 5685,
    • pages = {64--71},
    • month = mar,
    • url = {https://www.merl.com/publications/TR2005-076}
    • }
  •  Radhakrishnan, R., Divakaran, A., Xiong, Z., "A Time Series Clustering based Framework for Multimedia Mining and Summarization", ACM SIGMM International Workshop on Multimedia Information Retrieval (MIR), October 2004, pp. 157-164.
    BibTeX TR2004-046 PDF
    • @inproceedings{Radhakrishnan2004oct,
    • author = {Radhakrishnan, R. and Divakaran, A. and Xiong, Z.},
    • title = {A Time Series Clustering based Framework for Multimedia Mining and Summarization},
    • booktitle = {ACM SIGMM International Workshop on Multimedia Information Retrieval (MIR)},
    • year = 2004,
    • pages = {157--164},
    • month = oct,
    • isbn = {1-58113-940-3},
    • url = {https://www.merl.com/publications/TR2004-046}
    • }
  •  Wolf, P., Woelfel, J., van Gemert, J., Raj, B., Wong, D., "SpokenQuery: An Alternate Approach to Choosing Items with Speech", International Conference on Spoken Language Processing (ICSLP), October 2004.
    BibTeX TR2004-121 PDF
    • @inproceedings{Wolf2004oct,
    • author = {Wolf, P. and Woelfel, J. and {van Gemert}, J. and Raj, B. and Wong, D.},
    • title = {{SpokenQuery}: An Alternate Approach to Choosing Items with Speech},
    • booktitle = {International Conference on Spoken Language Processing (ICSLP)},
    • year = 2004,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2004-121}
    • }
  •  Smaragdis, P., "Discovering Auditory Objects Through Non-Negativity Constraints", Statistical and Perceptual Audio Processing (SAPA), October 2004.
    BibTeX TR2004-094 PDF
    • @inproceedings{Smaragdis2004oct,
    • author = {Smaragdis, P.},
    • title = {Discovering Auditory Objects Through Non-Negativity Constraints},
    • booktitle = {Statistical and Perceptual Audio Processing (SAPA)},
    • year = 2004,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2004-094}
    • }
  •  Seltzer, M.L., Raj, B., Stern, R.M., "Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition", IEEE Transactions on Speech and Audio Processing, Vol. 12, No. 5, pp. 489-498, September 2004.
    BibTeX TR2004-088 PDF
    • @article{Seltzer2004sep1,
    • author = {Seltzer, M. L. and Raj, B. and Stern, R. M.},
    • title = {Likelihood-Maximizing Beamforming for Robust Hands-Free Speech Recognition},
    • journal = {IEEE Transactions on Speech and Audio Processing},
    • year = 2004,
    • volume = 12,
    • number = 5,
    • pages = {489--498},
    • month = sep,
    • note = {Awarded Best Young Author, March 2007},
    • issn = {1063-6676},
    • url = {https://www.merl.com/publications/TR2004-088}
    • }
  •  Smaragdis, P., "Non-negative Matrix Factor Deconvolution; Extraction of Multiple Sound Sources from Monophonic Inputs", International Congress on Independent Component Analysis and Blind Signal Separation, September 2004, vol. 3195, pp. 494-499.
    BibTeX TR2004-104 PDF
    • @inproceedings{Smaragdis2004sep,
    • author = {Smaragdis, P.},
    • title = {Non-negative Matrix Factor Deconvolution; Extraction of Multiple Sound Sources from Monophonic Inputs},
    • booktitle = {International Congress on Independent Component Analysis and Blind Signal Separation},
    • year = 2004,
    • volume = 3195,
    • pages = {494--499},
    • month = sep,
    • isbn = {3-540-23056-4},
    • url = {https://www.merl.com/publications/TR2004-104}
    • }
  •  Seltzer, M.L., Raj, B., Stern, R.M., "A Bayesian Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 379-393, September 2004.
    BibTeX TR2004-086 PDF
    • @article{Seltzer2004sep2,
    • author = {Seltzer, M. L. and Raj, B. and Stern, R. M.},
    • title = {A {Bayesian} Classifier for Spectrographic Mask Estimation for Missing Feature Speech Recognition},
    • journal = {Speech Communication},
    • year = 2004,
    • volume = 43,
    • number = 4,
    • pages = {379--393},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2004-086}
    • }
  •  Raj, B., Seltzer, M.L., Stern, R.M., "Reconstruction of Missing Features for Robust Speech Recognition", Speech Communication, Vol. 43, No. 4, pp. 275-296, September 2004.
    BibTeX TR2004-087 PDF
    • @article{Raj2004sep,
    • author = {Raj, B. and Seltzer, M. L. and Stern, R. M.},
    • title = {Reconstruction of Missing Features for Robust Speech Recognition},
    • journal = {Speech Communication},
    • year = 2004,
    • volume = 43,
    • number = 4,
    • pages = {275--296},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2004-087}
    • }
  •  Singh, R., Raj, B., "Classification in Likelihood Spaces", Technometrics, Vol. 46, No. 3, pp. 318-329, August 2004.
    BibTeX TR2004-089 PDF
    • @article{Singh2004aug,
    • author = {Singh, R. and Raj, B.},
    • title = {Classification in Likelihood Spaces},
    • journal = {Technometrics},
    • year = 2004,
    • volume = 46,
    • number = 3,
    • pages = {318--329},
    • month = aug,
    • issn = {0040-1706},
    • url = {https://www.merl.com/publications/TR2004-089}
    • }
  •  Smaragdis, P., "Exploiting Redundancy to Construct Listening Systems", Perspectives on Speech Separation, July 2004.
    BibTeX SpringerLink
    • @inproceedings{Smaragdis2004jul,
    • author = {Smaragdis, P.},
    • title = {Exploiting Redundancy to Construct Listening Systems},
    • booktitle = {Perspectives on Speech Separation},
    • year = 2004,
    • month = jul,
    • url = {https://link.springer.com/chapter/10.1007/0-387-22794-6_7}
    • }
  •  Radhakrishnan, R., Xiong, Z., Divakaran, A., Memon, N., "Time Series Analysis and Segmentation Using Eigenvectors for Mining Semantic Audio Label Sequences", IEEE International Conference on Multimedia and Expo (ICME), June 2004.
    BibTeX TR2004-063 PDF
    • @inproceedings{Radhakrishnan2004jun,
    • author = {Radhakrishnan, R. and Xiong, Z. and Divakaran, A. and Memon, N.},
    • title = {Time Series Analysis and Segmentation Using Eigenvectors for Mining Semantic Audio Label Sequences},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2004,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2004-063}
    • }
  •  Xiong, Z., Radhakrishnan, R., Divakaran, A., Huang, T.S., "Effective and Efficient Sports Highlights Extraction Using the Minimum Description Length Criterion in Selecting GMM Structures", IEEE International Conference on Multimedia and Expo (ICME), June 2004.
    BibTeX TR2004-061 PDF
    • @inproceedings{Xiong2004jun,
    • author = {Xiong, Z. and Radhakrishnan, R. and Divakaran, A. and Huang, T. S.},
    • title = {Effective and Efficient Sports Highlights Extraction Using the Minimum Description Length Criterion in Selecting {GMM} Structures},
    • booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
    • year = 2004,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2004-061}
    • }
  •  Brown, J.C., Smaragdis, P., "Independent Component Analysis for Automatic Note Extraction from Musical Trills", Journal of the Acoustical Society of America, Vol. 115, No. 5, pp. 2295-2306, May 2004.
    BibTeX TR2004-078 PDF
    • @article{Brown2004may,
    • author = {Brown, J. C. and Smaragdis, P.},
    • title = {Independent Component Analysis for Automatic Note Extraction from Musical Trills},
    • journal = {Journal of the Acoustical Society of America},
    • year = 2004,
    • volume = 115,
    • number = 5,
    • pages = {2295--2306},
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-078}
    • }
  •  Raj, B., Singh, R., Stern, R.M., "On Tracking Noise with Linear Dynamical System Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2004, vol. 1, pp. 965-968.
    BibTeX TR2004-042 PDF
    • @inproceedings{Raj2004may,
    • author = {Raj, B. and Singh, R. and Stern, R. M.},
    • title = {On Tracking Noise with Linear Dynamical System Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2004,
    • volume = 1,
    • pages = {965--968},
    • month = may,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2004-042}
    • }
  •  DeVault, D., Rich, C., Sidner, C.L., "Natural Language Generation and Discourse Context: Computing Distractor Sets from the Focus Stack", International Florida Artificial Intelligence Research Symposium (FLAIRS), May 2004.
    BibTeX TR2004-004 PDF
    • @inproceedings{DeVault2004may,
    • author = {DeVault, D. and Rich, C. and Sidner, C. L.},
    • title = {Natural Language Generation and Discourse Context: Computing Distractor Sets from the Focus Stack},
    • booktitle = {International Florida Artificial Intelligence Research Symposium (FLAIRS)},
    • year = 2004,
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-004}
    • }
  •  Divi, V., Forlines, C., van Gemert, J.V., Raj, B., Schmidt-Nielsen, B., Wittenburg, K., Woelfel, J., Wolf, P., Zhang, F., "A Speech-In List-Out Approach to Spoken User Interfaces", Human Language Technology Conference (HLT), May 2004.
    BibTeX TR2004-023 PDF
    • @inproceedings{Divi2004may,
    • author = {Divi, V. and Forlines, C. and {van Gemert}, J. V. and Raj, B. and Schmidt-Nielsen, B. and Wittenburg, K. and Woelfel, J. and Wolf, P. and Zhang, F.},
    • title = {A Speech-In List-Out Approach to Spoken User Interfaces},
    • booktitle = {Human Language Technology Conference (HLT)},
    • year = 2004,
    • month = may,
    • url = {https://www.merl.com/publications/TR2004-023}
    • }