Publications

Nikovski, D.N., Byadarhaly, K., "Regularized Covariance Matrix Estimation with High Dimensional Data for Supervised Anomaly Detection Problems", IEEE International Joint Conference on Neural Networks (IJCNN), DOI: 10.1109/IJCNN.2016.7727554, July 2016, pp. 2811-2818.
BibTeX TR2016-099 PDF
- @inproceedings{Nikovski2016jul,
-   author    = {Nikovski, Daniel N. and Byadarhaly, Kiran},
-   title     = {{Regularized Covariance Matrix Estimation with High Dimensional Data for Supervised Anomaly Detection Problems}},
-   booktitle = {IEEE International Joint Conference on Neural Networks (IJCNN)},
-   pages     = {2811--2818},
-   month     = jul,
-   year      = {2016},
-   doi       = {10.1109/IJCNN.2016.7727554},
-   url       = {https://www.merl.com/publications/TR2016-099},
- }
Hori, C., Watanabe, S., Hori, T., Harsham, B.A., Hershey, J.R., Koji, Y., Fujii, Y., Furumoto, Y., "Driver Confusion Status Detection Using Recurrent Neural Networks", IEEE International Conference on Multimedia and Expo (ICME), DOI: 10.1109/ICME.2016.7552966, July 2016.
BibTeX TR2016-088 PDF
- @inproceedings{Hori2016jul,
-   author    = {Hori, Chiori and Watanabe, Shinji and Hori, Takaaki and Harsham, Bret A. and Hershey, John R. and Koji, Yusuke and Fujii, Youichi and Furumoto, Yuki},
-   title     = {{Driver Confusion Status Detection Using Recurrent Neural Networks}},
-   booktitle = {IEEE International Conference on Multimedia and Expo (ICME)},
-   month     = jul,
-   year      = {2016},
-   doi       = {10.1109/ICME.2016.7552966},
-   url       = {https://www.merl.com/publications/TR2016-088},
- }
Singh, B., Marks, T.K., Jones, M.J., Tuzel, C.O., Shao, M., "A Multi-Stream Bi-Directional Recurrent Neural Network for Fine-Grained Action Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2016.216, June 2016, pp. 1961-1970.
BibTeX TR2016-080 PDF Data
- @inproceedings{Singh2016jun,
-   author    = {Singh, Bharat and Marks, Tim K. and Jones, Michael J. and Tuzel, C. Oncel and Shao, Ming},
-   title     = {{A Multi-Stream Bi-Directional Recurrent Neural Network for Fine-Grained Action Detection}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   pages     = {1961--1970},
-   month     = jun,
-   year      = {2016},
-   doi       = {10.1109/CVPR.2016.216},
-   url       = {https://www.merl.com/publications/TR2016-080},
- }
Vemulapalli, R., Tuzel, C.O., Liu, M.-Y., "Deep Gaussian Conditional Random Field Network: A Model-based Deep Network for Discriminative Denoising", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2016.351, June 2016, pp. 4801-4809.
BibTeX TR2016-079 PDF
- @inproceedings{Vemulapalli2016jun2,
-   author    = {Vemulapalli, Raviteja and Tuzel, C. Oncel and Liu, Ming-Yu},
-   title     = {{Deep Gaussian Conditional Random Field Network: A Model-based Deep Network for Discriminative Denoising}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   pages     = {4801--4809},
-   month     = jun,
-   year      = {2016},
-   doi       = {10.1109/CVPR.2016.351},
-   url       = {https://www.merl.com/publications/TR2016-079},
- }
Vemulapalli, R., Tuzel, C.O., Liu, M.-Y., Chellappa, R., "Gaussian Conditional Random Field Network for Semantic Segmentation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2016, pp. 3224-3233.
BibTeX TR2016-078 PDF
- @inproceedings{Vemulapalli2016jun,
-   author    = {Vemulapalli, Raviteja and Tuzel, C. Oncel and Liu, Ming-Yu and Chellappa, Rama},
-   title     = {{Gaussian Conditional Random Field Network for Semantic Segmentation}},
-   booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
-   pages     = {3224--3233},
-   month     = jun,
-   year      = {2016},
-   url       = {https://www.merl.com/publications/TR2016-078},
- }
Son, K., Liu, M.-Y., Taguchi, Y., "Learning to Remove Multipath Distortions in Time-of-Flight Range Images for a Robotic Arm Setup", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA.2016.7487515, May 2016, pp. 3390-3397.
BibTeX TR2016-036 PDF
- @inproceedings{Son2016may,
-   author    = {Son, Kilho and Liu, Ming-Yu and Taguchi, Yuichi},
-   title     = {{Learning to Remove Multipath Distortions in Time-of-Flight Range Images for a Robotic Arm Setup}},
-   booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
-   pages     = {3390--3397},
-   month     = may,
-   year      = {2016},
-   doi       = {10.1109/ICRA.2016.7487515},
-   url       = {https://www.merl.com/publications/TR2016-036},
- }
Jones, M.J., Nikovski, D.N., Imamura, M., Hirata, T., "Exemplar Learning for Extremely Efficient Anomaly Detection in Real-Valued Time Series", Journal of Data Mining and Knowledge Discovery, DOI: 10.1007/s10618-015-0449-3, Vol. 30, No. 6, pp. 1427-1454, March 2016.
BibTeX TR2016-027 PDF
- @article{Jones2016mar,
-   author  = {Jones, Michael J. and Nikovski, Daniel N. and Imamura, Makoto and Hirata, Takahisa},
-   title   = {{Exemplar Learning for Extremely Efficient Anomaly Detection in Real-Valued Time Series}},
-   journal = {Journal of Data Mining and Knowledge Discovery},
-   volume  = {30},
-   number  = {6},
-   pages   = {1427--1454},
-   month   = mar,
-   year    = {2016},
-   doi     = {10.1007/s10618-015-0449-3},
-   issn    = {1573-756X},
-   url     = {https://www.merl.com/publications/TR2016-027},
- }
Hershey, J.R., Chen, Z., Le Roux, J., Watanabe, S., "Deep Clustering: Discriminative Embeddings for Segmentation and Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7471631, March 2016, pp. 31-35.
BibTeX TR2016-003 PDF
- @inproceedings{Hershey2016mar,
-   author    = {Hershey, John R. and Chen, Zhuo and {Le Roux}, Jonathan and Watanabe, Shinji},
-   title     = {{Deep Clustering: Discriminative Embeddings for Segmentation and Separation}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {31--35},
-   month     = mar,
-   year      = {2016},
-   doi       = {10.1109/ICASSP.2016.7471631},
-   url       = {https://www.merl.com/publications/TR2016-003},
- }
Hori, T., Hori, C., Watanabe, S., Hershey, J.R., "Minimum Word Error Training of Long Short-Term Memory Recurrent Neural Network Language Models for Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472827, March 2016, pp. 5990-5994.
BibTeX TR2016-011 PDF
- @inproceedings{Hori2016mar,
-   author    = {Hori, Takaaki and Hori, Chiori and Watanabe, Shinji and Hershey, John R.},
-   title     = {{Minimum Word Error Training of Long Short-Term Memory Recurrent Neural Network Language Models for Speech Recognition}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {5990--5994},
-   month     = mar,
-   year      = {2016},
-   doi       = {10.1109/ICASSP.2016.7472827},
-   url       = {https://www.merl.com/publications/TR2016-011},
- }
Vesely, K., Watanabe, S., Zmolikova, K., Karafiat, M., Burget, L., Cernocky, J.H., "Sequence Summarizing Neural Network for Speaker Adaptation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472692, March 2016, pp. 5315-5319.
BibTeX TR2016-001 PDF
- @inproceedings{Vesely2016mar,
- author = {Vesely, Karel and Watanabe, Shinji and Zmolikova, Katerina and Karafiat, Martin and Burget, Lukas and Cernocky, Jan Honza},
- title = {{Sequence Summarizing Neural Network for Speaker Adaptation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2016,
- pages = {5315--5319},
- month = mar,
- doi = {10.1109/ICASSP.2016.7472692},
- url = {https://www.merl.com/publications/TR2016-001}
- }
Wisdom, S., Hershey, J.R., Le Roux, J., Watanabe, S., "Deep Unfolding for Multichannel Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7471649, March 2016, pp. 121-125.
BibTeX TR2016-008 PDF
- @inproceedings{Wisdom2016mar,
-   author    = {Wisdom, Scott and Hershey, John R. and {Le Roux}, Jonathan and Watanabe, Shinji},
-   title     = {{Deep Unfolding for Multichannel Source Separation}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {121--125},
-   month     = mar,
-   year      = {2016},
-   doi       = {10.1109/ICASSP.2016.7471649},
-   url       = {https://www.merl.com/publications/TR2016-008},
- }
Xiao, X., Watanabe, S., Erdogan, H., Lu, L., Hershey, J., Seltzer, M., Chen, G., Zhang, Y., Mandel, M., Yu, D., "Deep Beamforming Networks for Multi-Channel Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2016.7472778, March 2016, pp. 5745-5749.
BibTeX TR2016-002 PDF
- @inproceedings{Xiao2016mar,
-   author    = {Xiao, Xiong and Watanabe, Shinji and Erdogan, Hakan and Lu, Liang and Hershey, John and Seltzer, Mike and Chen, Guoguo and Zhang, Yu and Mandel, Michael and Yu, Dong},
-   title     = {{Deep Beamforming Networks for Multi-Channel Speech Recognition}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   pages     = {5745--5749},
-   month     = mar,
-   year      = {2016},
-   doi       = {10.1109/ICASSP.2016.7472778},
-   url       = {https://www.merl.com/publications/TR2016-002},
- }
Liu, M.-Y., Mallya, A., Tuzel, C.O., Chen, X., "Unsupervised Network Pretraining via Encoding Human Design", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV.2016.7477698, March 2016, pp. 1-9.
BibTeX TR2016-022 PDF
- @inproceedings{Liu2016mar,
-   author    = {Liu, Ming-Yu and Mallya, Arun and Tuzel, C. Oncel and Chen, Xi},
-   title     = {{Unsupervised Network Pretraining via Encoding Human Design}},
-   booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
-   pages     = {1--9},
-   month     = mar,
-   year      = {2016},
-   doi       = {10.1109/WACV.2016.7477698},
-   url       = {https://www.merl.com/publications/TR2016-022},
- }
Farahmand, A.-M., Nikovski, D.N., Igarashi, Y., Konaka, H., "Truncated Approximate Dynamic Programming with Task-Dependent Terminal Value", Association for the Advancement of Artificial Intelligence (AAAI), February 2016, pp. 3123-3129.
BibTeX TR2016-020 PDF
- @inproceedings{Farahmand2016feb,
-   author    = {Farahmand, Amir-massoud and Nikovski, Daniel N. and Igarashi, Yuji and Konaka, Hiroki},
-   title     = {{Truncated Approximate Dynamic Programming with Task-Dependent Terminal Value}},
-   booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
-   pages     = {3123--3129},
-   month     = feb,
-   year      = {2016},
-   url       = {https://www.merl.com/publications/TR2016-020},
- }
Kanagawa, H., Tachioka, Y., Watanabe, S., Ishii, J., "Feature-Space Structural MAPLR with Regression Tree-Based Multiple Transformation Matrices for DNN", Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC), DOI: 10.1109/APSIPA.2015.7415425, December 2015, pp. 86-92.
BibTeX TR2015-150 PDF
- @inproceedings{Kanagawa2015dec,
-   author    = {Kanagawa, H. and Tachioka, Y. and Watanabe, S. and Ishii, J.},
-   title     = {{Feature-Space Structural MAPLR with Regression Tree-Based Multiple Transformation Matrices for DNN}},
-   booktitle = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
-   pages     = {86--92},
-   month     = dec,
-   year      = {2015},
-   doi       = {10.1109/APSIPA.2015.7415425},
-   url       = {https://www.merl.com/publications/TR2015-150},
- }
Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The Third 'CHiME' Speech Separation and Recognition Challenge: Dataset, Task and Baselines", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2015.7404837, December 2015, pp. 504-511.
BibTeX TR2015-136 PDF
- @inproceedings{Barker2015dec,
- author = {Barker, J. and Marxer, R. and Vincent, E. and Watanabe, S.},
- title = {{The Third 'CHiME' Speech Separation and Recognition Challenge: Dataset, Task and Baselines}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2015,
- pages = {504--511},
- month = dec,
- publisher = {IEEE},
- doi = {10.1109/ASRU.2015.7404837},
- url = {https://www.merl.com/publications/TR2015-136}
- }
Hsiao, R., Ma, J., Hartmann, W., Karafiat, M., Grezl, F., Burget, L., Szoke, I., Cernocky, J., Watanabe, S., Chen, Z., Mallidi, S.H., Hermansky, H., Tsakalidis, S., Schwartz, R., "Robust Speech Recognition in Unknown Reverberant and Noisy Conditions", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2015.7404841, December 2015, pp. 533-538.
BibTeX TR2015-138 PDF
- @inproceedings{Hsiao2015dec,
- author = {Hsiao, R. and Ma, J. and Hartmann, W. and Karafiat, M. and Grezl, F. and Burget, L. and Szoke, I. and Cernocky, J. and Watanabe, S. and Chen, Z. and Mallidi, S. H. and Hermansky, H. and Tsakalidis, S. and Schwartz, R.},
- title = {{Robust Speech Recognition in Unknown Reverberant and Noisy Conditions}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2015,
- pages = {533--538},
- month = dec,
- publisher = {IEEE},
- doi = {10.1109/ASRU.2015.7404841},
- url = {https://www.merl.com/publications/TR2015-138}
- }
Moriya, T., Shinozaki, T., Watanabe, S., Duh, K., "Automation of System Building for State-of-the-Art Large Vocabulary Speech Recognition Using Evolution Strategy", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2015.7404852, December 2015, pp. 610-616.
BibTeX TR2015-137 PDF
- @inproceedings{Moriya2015dec,
-   author    = {Moriya, T. and Shinozaki, T. and Watanabe, S. and Duh, K.},
-   title     = {{Automation of System Building for State-of-the-Art Large Vocabulary Speech Recognition Using Evolution Strategy}},
-   booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
-   pages     = {610--616},
-   month     = dec,
-   year      = {2015},
-   doi       = {10.1109/ASRU.2015.7404852},
-   url       = {https://www.merl.com/publications/TR2015-137},
- }
Hori, T., Chen, Z., Erdogan, H., Hershey, J.R., Le Roux, J., Mitra, V., Watanabe, S., "The MERL/SRI System for the 3rd CHiME Challenge Using Beamforming, Robust Feature Extraction, and Advanced Speech Recognition", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU.2015.7404833, December 2015, pp. 475-481.
BibTeX TR2015-135 PDF
- @inproceedings{Hori2015dec2,
- author = {Hori, T. and Chen, Z. and Erdogan, H. and Hershey, J. R. and {Le Roux}, J. and Mitra, V. and Watanabe, S.},
- title = {{The MERL/SRI System for the 3rd CHiME Challenge Using Beamforming, Robust Feature Extraction, and Advanced Speech Recognition}},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2015,
- pages = {475--481},
- month = dec,
- publisher = {IEEE},
- doi = {10.1109/ASRU.2015.7404833},
- url = {https://www.merl.com/publications/TR2015-135}
- }
Bagnell, J.A., Farahmand, A.-M., "Learning Positive Functions in a Hilbert Space", NIPS Workshop on Optimization for Machine Learning (OPT), December 2015.
BibTeX TR2015-133 PDF
- @inproceedings{Bagnell2015dec,
- author = {Bagnell, J. A. and Farahmand, A.-M.},
- title = {{Learning Positive Functions in a Hilbert Space}},
- booktitle = {NIPS Workshop on Optimization for Machine Learning (OPT)},
- year = 2015,
- month = dec,
- url = {https://www.merl.com/publications/TR2015-133}
- }
Hori, C., Hori, T., Watanabe, S., Hershey, J.R., "Context Sensitive Spoken Language Understanding Using Role Dependent LSTM Layers", NIPS Workshop on Machine Learning for Spoken Language Understanding and Interaction, December 2015.
BibTeX TR2015-134 PDF
- @inproceedings{Hori2015dec1,
- author = {Hori, C. and Hori, T. and Watanabe, S. and Hershey, J. R.},
- title = {{Context Sensitive Spoken Language Understanding Using Role Dependent LSTM Layers}},
- booktitle = {NIPS Workshop on Machine Learning for Spoken Language Understanding and Interaction},
- year = 2015,
- month = dec,
- url = {https://www.merl.com/publications/TR2015-134}
- }
Tawara, N., Ogawa, T., Watanabe, S., Nakamura, A., Kobayashi, T., "A Sampling-Based Speaker Clustering Using Utterance-Oriented Dirichlet Process Mixture Model and Its Evaluation on Large Scale Data", APSIPA Transactions on Signal and Information Processing, DOI: 10.1017/ATSIP.2015.19, Vol. 4, October 2015.
BibTeX TR2015-153 PDF
- @article{Tawara2015oct,
-   author  = {Tawara, N. and Ogawa, T. and Watanabe, S. and Nakamura, A. and Kobayashi, T.},
-   title   = {{A Sampling-Based Speaker Clustering Using Utterance-Oriented Dirichlet Process Mixture Model and Its Evaluation on Large Scale Data}},
-   journal = {APSIPA Transactions on Signal and Information Processing},
-   volume  = {4},
-   month   = oct,
-   year    = {2015},
-   doi     = {10.1017/ATSIP.2015.19},
-   issn    = {2048-7703},
-   url     = {https://www.merl.com/publications/TR2015-153},
- }
Harsham, B.A., Watanabe, S., Esenther, A., Hershey, J.R., Le Roux, J., Luan, Y., Nikovski, D.N., Potluru, V.K., "Driver Prediction to Improve Interaction with In-Vehicle HMI", Workshop on DSP for In-Vehicle Systems and Safety (DSP), October 2015.
BibTeX TR2015-120 PDF
- @inproceedings{Harsham2015oct,
- author = {Harsham, B. A. and Watanabe, S. and Esenther, A. and Hershey, J. R. and {Le Roux}, J. and Luan, Y. and Nikovski, D. N. and Potluru, V. K.},
- title = {{Driver Prediction to Improve Interaction with In-Vehicle HMI}},
- booktitle = {Workshop on DSP for In-Vehicle Systems and Safety (DSP)},
- year = 2015,
- month = oct,
- url = {https://www.merl.com/publications/TR2015-120}
- }
Abdelaziz, A.H., Watanabe, S., Hershey, J.R., Vincent, E., Kolossa, D., "Uncertainty Propagation Through Deep Neural Networks", Interspeech, September 2015, vol. 1 of 5, pp. 3561.
BibTeX TR2015-098 PDF
- @inproceedings{Abdelaziz2015sep,
- author = {Abdelaziz, A. H. and Watanabe, S. and Hershey, J. R. and Vincent, E. and Kolossa, D.},
- title = {{Uncertainty Propagation Through Deep Neural Networks}},
- booktitle = {Interspeech},
- year = 2015,
- volume = {1 of 5},
- pages = 3561,
- month = sep,
- isbn = {978-1-5108-1790-6},
- url = {https://www.merl.com/publications/TR2015-098}
- }
Chen, Z., Watanabe, S., Erdogan, H., Hershey, J.R., "Speech Enhancement and Recognition Using Multi-Task Learning of Long Short-Term Memory Recurrent Neural Networks", Interspeech, September 2015, vol. 1 of 5, pp. 1278.
BibTeX TR2015-100 PDF
- @inproceedings{Chen2015sep,
- author = {Chen, Z. and Watanabe, S. and Erdogan, H. and Hershey, J. R.},
- title = {{Speech Enhancement and Recognition Using Multi-Task Learning of Long Short-Term Memory Recurrent Neural Networks}},
- booktitle = {Interspeech},
- year = 2015,
- volume = {1 of 5},
- pages = 1278,
- month = sep,
- isbn = {978-1-5108-1790-6},
- url = {https://www.merl.com/publications/TR2015-100}
- }