Publications

364 / 3,734 publications found.


  •  Wittenburg, K., Lanning, T., Schwenke, D., Shubin, H., Vetro, A., "The Prospects for Unrestricted Speech Input for TV Content Search", International Working Conference on Advanced Visual Interfaces (AVI), May 2006.
    BibTeX TR2006-045 PDF
    • @inproceedings{Wittenburg2006may,
    • author = {Wittenburg, K. and Lanning, T. and Schwenke, D. and Shubin, H. and Vetro, A.},
    • title = {The Prospects for Unrestricted Speech Input for TV Content Search},
    • booktitle = {International Working Conference on Advanced Visual Interfaces (AVI)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-045}
    • }
  •  Tse, E., Shen, C., Greenberg, S., Forlines, C., "Enabling Interaction with Single User Applications through Speech and Gestures on a Multi-User Tabletop", International Working Conference on Advanced Visual Interfaces (AVI), May 2006.
    BibTeX TR2005-130 PDF
    • @inproceedings{Tse2006may1,
    • author = {Tse, E. and Shen, C. and Greenberg, S. and Forlines, C.},
    • title = {Enabling Interaction with Single User Applications through Speech and Gestures on a Multi-User Tabletop},
    • booktitle = {International Working Conference on Advanced Visual Interfaces (AVI)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2005-130}
    • }
  •  Radhakrishnan, R., Divakaran, A., "Generative Process Tracking for Audio Analysis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006, vol. 5, pp. V.
    BibTeX TR2006-053 PDF
    • @inproceedings{Radhakrishnan2006may,
    • author = {Radhakrishnan, R. and Divakaran, A.},
    • title = {Generative Process Tracking for Audio Analysis},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2006,
    • volume = 5,
    • pages = {V},
    • month = may,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2006-053}
    • }
  •  Raj, B., Shashanka, M.V.S., Smaragdis, P., "Latent Dirichlet Decomposition for Single Channel Speaker Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006.
    BibTeX TR2006-064 PDF
    • @inproceedings{Raj2006may,
    • author = {Raj, B. and Shashanka, M.V.S. and Smaragdis, P.},
    • title = {Latent Dirichlet Decomposition for Single Channel Speaker Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-064}
    • }
  •  Shashanka, M.V.S., Smaragdis, P., "Secure Sound Classification: Gaussian Mixture Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2006.
    BibTeX TR2006-065 PDF
    • @inproceedings{Shashanka2006may,
    • author = {Shashanka, M.V.S. and Smaragdis, P.},
    • title = {Secure Sound Classification: Gaussian Mixture Models},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-065}
    • }
  •  Tse, E., Greenberg, S., Shen, C., Forlines, C., "Multimodal Multiplayer Tabletop Gaming", International Workshop on Pervasive Gaming Applications (PerGames), May 2006.
    BibTeX TR2006-009 PDF
    • @inproceedings{Tse2006may2,
    • author = {Tse, E. and Greenberg, S. and Shen, C. and Forlines, C.},
    • title = {Multimodal Multiplayer Tabletop Gaming},
    • booktitle = {International Workshop on Pervasive Gaming Applications (PerGames)},
    • year = 2006,
    • month = may,
    • url = {https://www.merl.com/publications/TR2006-009}
    • }
  •  Xing, L., Yu, H., Huang, Q., Ye, Q., Divakaran, A., "Subjective Evaluation Criterion for Selecting Affective Features and Modeling Highlights", SPIE Conference on Multimedia Content Analysis, Management and Retrieval, January 2006, vol. 6073, pp. 188-195.
    BibTeX TR2006-027 PDF
    • @inproceedings{Xing2006jan,
    • author = {Xing, L. and Yu, H. and Huang, Q. and Ye, Q. and Divakaran, A.},
    • title = {Subjective Evaluation Criterion for Selecting Affective Features and Modeling Highlights},
    • booktitle = {SPIE Conference on Multimedia Content Analysis, Management and Retrieval},
    • year = 2006,
    • volume = 6073,
    • pages = {188--195},
    • month = jan,
    • url = {https://www.merl.com/publications/TR2006-027}
    • }
  •  Shen, C., "Multi-User Interface and Interactions on Direct-Touch Horizontal Surfaces: Collaborative Tabletop Research at MERL", IEEE International Workshop on Horizontal Interactive Human-Computer Systems (TableTop), January 2006, pp. 53-54.
    BibTeX TR2005-119 PDF
    • @inproceedings{Shen2006jan,
    • author = {Shen, C.},
    • title = {Multi-User Interface and Interactions on Direct-Touch Horizontal Surfaces: Collaborative Tabletop Research at MERL},
    • booktitle = {IEEE International Workshop on Horizontal Interactive Human-Computer Systems (TableTop)},
    • year = 2006,
    • pages = {53--54},
    • month = jan,
    • isbn = {0-7695-2494-X},
    • url = {https://www.merl.com/publications/TR2005-119}
    • }
  •  Raj, B., Singh, R., "Reconstructing Spectral Vectors with Uncertain Spectrographic Masks for Robust Speech Recognition", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), November 2005, pp. 27-32.
    BibTeX TR2005-160 PDF
    • @inproceedings{Raj2005nov,
    • author = {Raj, B. and Singh, R.},
    • title = {Reconstructing Spectral Vectors with Uncertain Spectrographic Masks for Robust Speech Recognition},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2005,
    • pages = {27--32},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2005-160}
    • }
  •  Hu, R., Raj, B., "A Robust Voice Activity Detector Using an Acoustic Doppler Radar", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), November 2005, pp. 171-176.
    BibTeX TR2005-159 PDF
    • @inproceedings{Hu2005nov,
    • author = {Hu, R. and Raj, B.},
    • title = {A Robust Voice Activity Detector Using an Acoustic Doppler Radar},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2005,
    • pages = {171--176},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2005-159}
    • }
  •  Raj, B., Smaragdis, P., "Latent Variable Decomposition of Spectrograms for Single Channel Speaker Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), October 2005, pp. 17-20.
    BibTeX TR2005-137 PDF
    • @inproceedings{Raj2005oct,
    • author = {Raj, B. and Smaragdis, P.},
    • title = {Latent Variable Decomposition of Spectrograms for Single Channel Speaker Separation},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2005,
    • pages = {17--20},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2005-137}
    • }
  •  Brand, M., "Nonrigid Embeddings for Dimensionality Reduction", European Conference on Machine Learning (ECML), October 2005, vol. 3720.
    BibTeX TR2005-117 PDF
    • @inproceedings{Brand2005oct,
    • author = {Brand, M.},
    • title = {Nonrigid Embeddings for Dimensionality Reduction},
    • booktitle = {European Conference on Machine Learning (ECML)},
    • year = 2005,
    • volume = 3720,
    • month = oct,
    • isbn = {3-540-29243-8},
    • url = {https://www.merl.com/publications/TR2005-117}
    • }
  •  Bansal, D., Raj, B., Smaragdis, P., "Bandwidth Expansion of Narrowband Speech Using Non-Negative Matrix Factorization", Eurospeech, September 2005.
    BibTeX TR2005-135 PDF
    • @inproceedings{Bansal2005sep,
    • author = {Bansal, D. and Raj, B. and Smaragdis, P.},
    • title = {Bandwidth Expansion of Narrowband Speech Using Non-Negative Matrix Factorization},
    • booktitle = {Eurospeech},
    • year = 2005,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2005-135}
    • }
  •  Raj, B., Singh, R., Smaragdis, P., "Recognizing Speech from Simultaneous Speakers", Eurospeech, September 2005.
    BibTeX TR2005-136 PDF
    • @inproceedings{Raj2005sep,
    • author = {Raj, B. and Singh, R. and Smaragdis, P.},
    • title = {Recognizing Speech from Simultaneous Speakers},
    • booktitle = {Eurospeech},
    • year = 2005,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2005-136}
    • }
  •  Vlasic, D., Brand, M., Pfister, H., Popovic, J., "Face Transfer with Multilinear Models", ACM Transactions on Graphics (TOG), Vol. 24, No. 3, pp. 426-433, July 2005.
    BibTeX TR2005-048 PDF
    • @article{Vlasic2005jul,
    • author = {Vlasic, D. and Brand, M. and Pfister, H. and Popovic, J.},
    • title = {Face Transfer with Multilinear Models},
    • journal = {ACM Transactions on Graphics (TOG)},
    • year = 2005,
    • volume = 24,
    • number = 3,
    • pages = {426--433},
    • month = jul,
    • issn = {0730-0301},
    • url = {https://www.merl.com/publications/TR2005-048}
    • }
  •  Rich, C., Sidner, C., Lesh, N., Garland, A., Booth, S., Chimani, M., "DiamondHelp: A Collaborative Interface Framework for Networked Home Appliances", IEEE International Conference on Distributed Computing Systems Workshops, June 2005, pp. 514-519.
    BibTeX TR2004-114 PDF
    • @inproceedings{Rich2005jun,
    • author = {Rich, C. and Sidner, C. and Lesh, N. and Garland, A. and Booth, S. and Chimani, M.},
    • title = {DiamondHelp: A Collaborative Interface Framework for Networked Home Appliances},
    • booktitle = {IEEE International Conference on Distributed Computing Systems Workshops},
    • year = 2005,
    • pages = {514--519},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2004-114}
    • }
  •  Hancock, M.S., Shen, C., Forlines, C., Ryall, K., "Exploring Non-Speech Auditory Feedback at an Interactive Multi-User Tabletop", Conference on Graphics Interface (GI), May 2005, pp. 41-50.
    BibTeX TR2005-054 PDF
    • @inproceedings{Hancock2005may,
    • author = {Hancock, M.S. and Shen, C. and Forlines, C. and Ryall, K.},
    • title = {Exploring Non-Speech Auditory Feedback at an Interactive Multi-User Tabletop},
    • booktitle = {Conference on Graphics Interface (GI)},
    • year = 2005,
    • pages = {41--50},
    • month = may,
    • issn = {0713-5424},
    • url = {https://www.merl.com/publications/TR2005-054}
    • }
  •  Guinness, J., Raj, B., Schmidt-Nielsen, B., Turicchia, L., Sarpeshkar, R., "A Companding Front End for Noise-Robust Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 1, pp. 249-252.
    BibTeX TR2005-023 PDF
    • @inproceedings{Guinness2005mar,
    • author = {Guinness, J. and Raj, B. and Schmidt-Nielsen, B. and Turicchia, L. and Sarpeshkar, R.},
    • title = {A Companding Front End for Noise-Robust Automatic Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2005,
    • volume = 1,
    • pages = {249--252},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2005-023}
    • }
  •  Nie, Y., Kong, H.-S., Vetro, A., Barner, K., "Fast Adaptive Fuzzy Post-Filtering for Coding Artifacts Removal in Interlaced Video", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 993-996.
    BibTeX TR2005-018 PDF
    • @inproceedings{Nie2005mar,
    • author = {Nie, Y. and Kong, H.-S. and Vetro, A. and Barner, K.},
    • title = {Fast Adaptive Fuzzy Post-Filtering for Coding Artifacts Removal in Interlaced Video},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2005,
    • volume = 2,
    • pages = {993--996},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2005-018}
    • }
  •  Wang, B., Wang, Y., Selesnick, I., Vetro, A., "Video Coding Using 3-D Dual-Tree Discrete Wavelet Transforms", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 61-64.
    BibTeX TR2005-019 PDF
    • @inproceedings{Wang2005mar,
    • author = {Wang, B. and Wang, Y. and Selesnick, I. and Vetro, A.},
    • title = {Video Coding Using 3-D Dual-Tree Discrete Wavelet Transforms},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2005,
    • volume = 2,
    • pages = {61--64},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2005-019}
    • }
  •  Xie, L., Kennedy, L., Chang, S.-F., Divakaran, A., Sun, H., Lin, C.-Y., "Layered Dynamic Mixture Model for Pattern Discovery in Asynchronous Multi-Modal Streams", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2005, vol. 2, pp. 1053-1056.
    BibTeX TR2005-078 PDF
    • @inproceedings{Xie2005mar,
    • author = {Xie, L. and Kennedy, L. and Chang, S.-F. and Divakaran, A. and Sun, H. and Lin, C.-Y.},
    • title = {Layered Dynamic Mixture Model for Pattern Discovery in Asynchronous Multi-Modal Streams},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2005,
    • volume = 2,
    • pages = {1053--1056},
    • month = mar,
    • issn = {1520-6149},
    • url = {https://www.merl.com/publications/TR2005-078}
    • }
  •  Radhakrishnan, R., Divakaran, A., "Systematic Acquisition of Audio Classes for Elevator Surveillance", SPIE Conference on Image and Video Communications and Processing, March 2005, vol. 5685, pp. 64-71.
    BibTeX TR2005-076 PDF
    • @inproceedings{Radhakrishnan2005mar,
    • author = {Radhakrishnan, R. and Divakaran, A.},
    • title = {Systematic Acquisition of Audio Classes for Elevator Surveillance},
    • booktitle = {SPIE Conference on Image and Video Communications and Processing},
    • year = 2005,
    • volume = 5685,
    • pages = {64--71},
    • month = mar,
    • url = {https://www.merl.com/publications/TR2005-076}
    • }
  •  Radhakrishnan, R., Otsuka, I., Xiong, Z., Divakaran, A., "Modelling Sports Highlights Using a Time Series Clustering Framework and Model Interpretation", SPIE Conference on Storage and Retrieval Methods and Applications for Multimedia, January 2005, vol. 5682, pp. 269-276.
    BibTeX TR2005-077 PDF
    • @inproceedings{Radhakrishnan2005jan,
    • author = {Radhakrishnan, R. and Otsuka, I. and Xiong, Z. and Divakaran, A.},
    • title = {Modelling Sports Highlights Using a Time Series Clustering Framework and Model Interpretation},
    • booktitle = {SPIE Conference on Storage and Retrieval Methods and Applications for Multimedia},
    • year = 2005,
    • volume = 5682,
    • pages = {269--276},
    • month = jan,
    • url = {https://www.merl.com/publications/TR2005-077}
    • }
  •  Divakaran, A., Otsuka, I., Radhakrishnan, R., Nakane, K., Ogawa, M., "Audio-Assisted Video Browsing for DVD Recorders", IEEE Pacific-Rim Conference on Multimedia (PCM), November 2004.
    BibTeX TR2004-139 PDF
    • @inproceedings{Divakaran2004nov,
    • author = {Divakaran, A. and Otsuka, I. and Radhakrishnan, R. and Nakane, K. and Ogawa, M.},
    • title = {Audio-Assisted Video Browsing for DVD Recorders},
    • booktitle = {IEEE Pacific-Rim Conference on Multimedia (PCM)},
    • year = 2004,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2004-139}
    • }
  •  Xie, L., Kennedy, L., Chang, S.-F., Divakaran, A., Sun, H., Lin, C.-Y., "Discovering Meaningful Multimedia Patterns with Audio-Visual Concepts and Associated Text", IEEE International Conference on Image Processing (ICIP), October 2004, vol. 4, pp. 2383-2386.
    BibTeX TR2004-128 PDF
    • @inproceedings{Xie2004oct,
    • author = {Xie, L. and Kennedy, L. and Chang, S.-F. and Divakaran, A. and Sun, H. and Lin, C.-Y.},
    • title = {Discovering Meaningful Multimedia Patterns with Audio-Visual Concepts and Associated Text},
    • booktitle = {IEEE International Conference on Image Processing (ICIP)},
    • year = 2004,
    • volume = 4,
    • pages = {2383--2386},
    • month = oct,
    • issn = {1522-4880},
    • url = {https://www.merl.com/publications/TR2004-128}
    • }