Publications

Meng, Z., Watanabe, S., Hershey, J.R., Erdogan, H., "Deep Long Short-Term Memory Adaptive Beamforming Networks for Multichannel Robust Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-012 PDF
- @inproceedings{Meng2017mar,
-   author    = {Meng, Zhong and Watanabe, Shinji and Hershey, John R. and Erdogan, Hakan},
-   title     = {{Deep Long Short-Term Memory Adaptive Beamforming Networks for Multichannel Robust Speech Recognition}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   month     = mar,
-   year      = {2017},
-   url       = {https://www.merl.com/publications/TR2017-012}
- }
Watanabe, S., Hori, T., Le Roux, J., Hershey, J.R., "Student-Teacher Network Learning with Enhanced Features", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
BibTeX TR2017-011 PDF
- @inproceedings{Watanabe2017mar,
-   author    = {Watanabe, Shinji and Hori, Takaaki and {Le Roux}, Jonathan and Hershey, John R.},
-   title     = {{Student-Teacher Network Learning with Enhanced Features}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   month     = mar,
-   year      = {2017},
-   url       = {https://www.merl.com/publications/TR2017-011}
- }
Hara, K., Liu, M.-Y., Tuzel, C.O., Farahmand, A.-M., "Attentional Network for Visual Object Detection", arXiv, January 2017.
BibTeX arXiv
- @article{Hara2017jan,
-   author        = {Hara, Kota and Liu, Ming-Yu and Tuzel, C. Oncel and Farahmand, Amir-massoud},
-   title         = {{Attentional Network for Visual Object Detection}},
-   journal       = {arXiv},
-   month         = jan,
-   year          = {2017},
-   eprint        = {1702.01478},
-   archiveprefix = {arXiv},
-   url           = {https://arxiv.org/abs/1702.01478}
- }
Xiao, X., Watanabe, S., Chng, E.S., Li, H., "Beamforming Networks Using Spatial Covariance Features for Far-field Speech Recognition", Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC), DOI: 10.1109/APSIPA.2016.7820724, December 2016.
BibTeX TR2016-162 PDF
- @inproceedings{Xiao2016dec,
-   author    = {Xiao, Xiong and Watanabe, Shinji and Chng, Eng Siong and Li, Haizhou},
-   title     = {{Beamforming Networks Using Spatial Covariance Features for Far-field Speech Recognition}},
-   booktitle = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
-   month     = dec,
-   year      = {2016},
-   doi       = {10.1109/APSIPA.2016.7820724},
-   url       = {https://www.merl.com/publications/TR2016-162}
- }
Hori, T., Wang, H., Hori, C., Watanabe, S., Harsham, B.A., Le Roux, J., Hershey, J.R., Koji, Y., Jing, Y., Zhu, Z., Aikawa, T., "Dialog State Tracking with Attention-based Sequence-to-sequence Learning", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/SLT.2016.7846317, December 2016, pp. 552-558.
BibTeX TR2016-163 PDF
- @inproceedings{Hori2016dec,
-   author    = {Hori, Takaaki and Wang, Hai and Hori, Chiori and Watanabe, Shinji and Harsham, Bret A. and {Le Roux}, Jonathan and Hershey, John R. and Koji, Yusuke and Jing, Yi and Zhu, Zhaocheng and Aikawa, Takeyuki},
-   title     = {{Dialog State Tracking with Attention-based Sequence-to-sequence Learning}},
-   booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
-   pages     = {552--558},
-   month     = dec,
-   year      = {2016},
-   doi       = {10.1109/SLT.2016.7846317},
-   url       = {https://www.merl.com/publications/TR2016-163}
- }
Farahmand, A.-M., Nabi, S., Grover, P., Nikovski, D.N., "Learning to Control Partial Differential Equations: Regularized Fitted Q-Iteration Approach", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/CDC.2016.7798966, December 2016, pp. 4578-4585.
BibTeX TR2016-145 PDF
- @inproceedings{Farahmand2016dec,
-   author    = {Farahmand, Amir-massoud and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
-   title     = {{Learning to Control Partial Differential Equations: Regularized Fitted Q-Iteration Approach}},
-   booktitle = {IEEE Conference on Decision and Control (CDC)},
-   pages     = {4578--4585},
-   month     = dec,
-   year      = {2016},
-   doi       = {10.1109/CDC.2016.7798966},
-   url       = {https://www.merl.com/publications/TR2016-145}
- }
Takano, T., Moriya, T., Shinozaki, T., Watanabe, S., Hori, T., Duh, K., "Automated Structure Discovery and Parameter Tuning of Neural Network Language Model Based on Evolution Strategy", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/SLT.2016.7846334, December 2016.
BibTeX TR2016-173 PDF
- @inproceedings{Takano2016dec,
-   author    = {Takano, Tomihiro and Moriya, Takafumi and Shinozaki, Takahiro and Watanabe, Shinji and Hori, Takaaki and Duh, Kevin},
-   title     = {{Automated Structure Discovery and Parameter Tuning of Neural Network Language Model Based on Evolution Strategy}},
-   booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
-   month     = dec,
-   year      = {2016},
-   doi       = {10.1109/SLT.2016.7846334},
-   url       = {https://www.merl.com/publications/TR2016-173}
- }
Laftchiev, E., Nikovski, D.N., "An IoT System to Estimate Personal Thermal Comfort", IEEE World Forum on Internet of Things (WF-IoT), DOI: 10.1109/WF-IoT.2016.7845401, December 2016, pp. 672-677.
BibTeX TR2016-161 PDF
- @inproceedings{Laftchiev2016dec,
-   author    = {Laftchiev, Emil and Nikovski, Daniel N.},
-   title     = {{An IoT System to Estimate Personal Thermal Comfort}},
-   booktitle = {IEEE World Forum on Internet of Things (WF-IoT)},
-   pages     = {672--677},
-   month     = dec,
-   year      = {2016},
-   doi       = {10.1109/WF-IoT.2016.7845401},
-   url       = {https://www.merl.com/publications/TR2016-161}
- }
Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The Third 'CHIME' Speech Separation and Recognition Challenge: Analysis and Outcomes", Computer Speech & Language, DOI: 10.1016/j.csl.2016.10.005, December 2016.
BibTeX TR2016-171 PDF
- @article{Barker2016dec,
-   author    = {Barker, Jon and Marxer, Ricard and Vincent, Emmanuel and Watanabe, Shinji},
-   title     = {{The Third `CHIME' Speech Separation and Recognition Challenge: Analysis and Outcomes}},
-   journal   = {Computer Speech \& Language},
-   month     = dec,
-   year      = {2016},
-   publisher = {Elsevier},
-   doi       = {10.1016/j.csl.2016.10.005},
-   url       = {https://www.merl.com/publications/TR2016-171}
- }
Liu, M.-Y., Tuzel, C.O., Sullivan, A., "Coupled Generative Adversarial Nets", Advances in Neural Information Processing Systems (NIPS), December 2016.
BibTeX TR2016-156 PDF
- @inproceedings{Liu2016dec,
-   author    = {Liu, Ming-Yu and Tuzel, C. Oncel and Sullivan, Alan},
-   title     = {{Coupled Generative Adversarial Nets}},
-   booktitle = {Advances in Neural Information Processing Systems (NIPS)},
-   month     = dec,
-   year      = {2016},
-   url       = {https://www.merl.com/publications/TR2016-156}
- }
Wisdom, S., Powers, T., Hershey, J.R., Le Roux, J., Atlas, L., "Full-Capacity Unitary Recurrent Neural Networks", Advances in Neural Information Processing Systems (NIPS), December 2016.
BibTeX TR2016-155 PDF
- @inproceedings{Wisdom2016dec,
-   author    = {Wisdom, Scott and Powers, Thomas and Hershey, John R. and {Le Roux}, Jonathan and Atlas, Les},
-   title     = {{Full-Capacity Unitary Recurrent Neural Networks}},
-   booktitle = {Advances in Neural Information Processing Systems (NIPS)},
-   month     = dec,
-   year      = {2016},
-   url       = {https://www.merl.com/publications/TR2016-155}
- }
Vincent, E., Watanabe, S., Nugraha, A.A., Barker, J., Marxer, R., "An analysis of environment, microphone and data simulation mismatches in robust speech recognition", Computer Speech & Language, DOI: 10.1016/j.csl.2016.11.005, December 2016.
BibTeX TR2016-172 PDF
- @article{Vincent2016dec,
-   author    = {Vincent, Emmanuel and Watanabe, Shinji and Nugraha, Aditya Arie and Barker, Jon and Marxer, Ricard},
-   title     = {{An analysis of environment, microphone and data simulation mismatches in robust speech recognition}},
-   journal   = {Computer Speech \& Language},
-   month     = dec,
-   year      = {2016},
-   publisher = {Elsevier},
-   doi       = {10.1016/j.csl.2016.11.005},
-   url       = {https://www.merl.com/publications/TR2016-172}
- }
Chen, C., Liu, M.-Y., Tuzel, C.O., Xiao, J., "R-CNN for Small Object Detection", Asian Conference on Computer Vision (ACCV), DOI: 10.1007/978-3-319-54193-8_14, November 2016, vol. 10115, pp. 214-230.
BibTeX TR2016-144 PDF
- @inproceedings{Chen2016nov,
-   author    = {Chen, Chenyi and Liu, Ming-Yu and Tuzel, C. Oncel and Xiao, Jianxiong},
-   title     = {{R-CNN for Small Object Detection}},
-   booktitle = {Asian Conference on Computer Vision (ACCV)},
-   volume    = {10115},
-   pages     = {214--230},
-   month     = nov,
-   year      = {2016},
-   doi       = {10.1007/978-3-319-54193-8_14},
-   url       = {https://www.merl.com/publications/TR2016-144}
- }
Tawara, N., Ogawa, T., Watanabe, S., Kobayashi, T., "Nested Gibbs sampling for mixture-of-mixture model and its application to speaker clustering", APSIPA Transactions on Signal and Information Processing, DOI: 10.1017/ATSIP.2016.15, Vol. 5, October 2016.
BibTeX TR2016-138 PDF
- @article{Tawara2016oct,
-   author  = {Tawara, Naohiro and Ogawa, Tetsuji and Watanabe, Shinji and Kobayashi, Tetsunori},
-   title   = {{Nested Gibbs sampling for mixture-of-mixture model and its application to speaker clustering}},
-   journal = {APSIPA Transactions on Signal and Information Processing},
-   volume  = {5},
-   month   = oct,
-   year    = {2016},
-   doi     = {10.1017/ATSIP.2016.15},
-   url     = {https://www.merl.com/publications/TR2016-138}
- }
Ozcan, G., Pajovic, M., Sahinoglu, Z., Wang, Y., Orlik, P.V., Wada, T., "Online State of Charge Estimation for Lithium-Ion Batteries Using Gaussian Process Regression", IEEE Industrial Electronics Society (IECON), DOI: 10.1109/IECON.2016.7793002, October 2016, pp. 998-1003.
BibTeX TR2016-136 PDF
- @inproceedings{Ozcan2016oct,
-   author    = {Ozcan, Gozde and Pajovic, Milutin and Sahinoglu, Zafer and Wang, Yebin and Orlik, Philip V. and Wada, Toshihiro},
-   title     = {{Online State of Charge Estimation for Lithium-Ion Batteries Using Gaussian Process Regression}},
-   booktitle = {IEEE Industrial Electronics Society (IECON)},
-   pages     = {998--1003},
-   month     = oct,
-   year      = {2016},
-   doi       = {10.1109/IECON.2016.7793002},
-   url       = {https://www.merl.com/publications/TR2016-136}
- }
Tuzel, C.O., Marks, T.K., Tambe, S., "Robust Face Alignment Using a Mixture of Invariant Experts", European Conference on Computer Vision (ECCV), DOI: 10.1007/978-3-319-46454-1_50, October 2016, vol. 9909, pp. 825-841.
BibTeX TR2016-129 PDF
- @inproceedings{Tuzel2016oct,
-   author    = {Tuzel, C. Oncel and Marks, Tim K. and Tambe, Salil},
-   title     = {{Robust Face Alignment Using a Mixture of Invariant Experts}},
-   booktitle = {European Conference on Computer Vision (ECCV)},
-   volume    = {9909},
-   pages     = {825--841},
-   month     = oct,
-   year      = {2016},
-   doi       = {10.1007/978-3-319-46454-1_50},
-   url       = {https://www.merl.com/publications/TR2016-129}
- }
Sankaran, B., Ramalingam, S., Taguchi, Y., "Parameter Learning for Improving Binary Descriptor Matching", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS.2016.7759718, October 2016, pp. 4892-4897.
BibTeX TR2016-132 PDF
- @inproceedings{Sankaran2016oct,
-   author    = {Sankaran, Bharath and Ramalingam, Srikumar and Taguchi, Yuichi},
-   title     = {{Parameter Learning for Improving Binary Descriptor Matching}},
-   booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
-   pages     = {4892--4897},
-   month     = oct,
-   year      = {2016},
-   doi       = {10.1109/IROS.2016.7759718},
-   url       = {https://www.merl.com/publications/TR2016-132}
- }
Delcroix, M., Watanabe, S., "Recent Advances in Distant Speech Recognition," Tech. Rep. TR2016-115, Interspeech Tutorials, September 2016.
BibTeX TR2016-115 PDF
- @techreport{Delcroix2016sep,
-   author      = {Delcroix, Marc and Watanabe, Shinji},
-   title       = {{Recent Advances in Distant Speech Recognition}},
-   booktitle   = {Interspeech Tutorials},
-   institution = {Interspeech},
-   number      = {TR2016-115},
-   month       = sep,
-   year        = {2016},
-   url         = {https://www.merl.com/publications/TR2016-115}
- }
Le Roux, J., Vincent, E., Erdogan, H., "Learning-Based Approaches to Speech Enhancement and Separation," Tech. Rep. TR2016-113, Interspeech Tutorials, September 2016.
BibTeX TR2016-113 PDF
- @techreport{LeRoux2016sep,
-   author      = {{Le Roux}, Jonathan and Vincent, Emmanuel and Erdogan, Hakan},
-   title       = {{Learning-Based Approaches to Speech Enhancement and Separation}},
-   booktitle   = {Interspeech Tutorials},
-   institution = {Interspeech},
-   number      = {TR2016-113},
-   month       = sep,
-   year        = {2016},
-   url         = {https://www.merl.com/publications/TR2016-113}
- }
Erdogan, H., Hershey, J.R., Watanabe, S., Mandel, M., Le Roux, J., "Improved MVDR beamforming using single-channel mask prediction networks", Interspeech, DOI: 10.21437/Interspeech.2016-552, September 2016, pp. 1981-1985.
BibTeX TR2016-072 PDF
- @inproceedings{Erdogan2016sep,
-   author    = {Erdogan, Hakan and Hershey, John R. and Watanabe, Shinji and Mandel, Michael and {Le Roux}, Jonathan},
-   title     = {{Improved MVDR beamforming using single-channel mask prediction networks}},
-   booktitle = {Interspeech},
-   pages     = {1981--1985},
-   month     = sep,
-   year      = {2016},
-   doi       = {10.21437/Interspeech.2016-552},
-   url       = {https://www.merl.com/publications/TR2016-072}
- }
Hori, C., Hori, T., Watanabe, S., Hershey, J.R., "Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs", Interspeech, DOI: 10.21437/Interspeech.2016-1171, September 2016, pp. 3236-3240.
BibTeX TR2016-074 PDF
- @inproceedings{Hori2016sep,
-   author    = {Hori, Chiori and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
-   title     = {{Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs}},
-   booktitle = {Interspeech},
-   pages     = {3236--3240},
-   month     = sep,
-   year      = {2016},
-   doi       = {10.21437/Interspeech.2016-1171},
-   url       = {https://www.merl.com/publications/TR2016-074}
- }
Isik, Y., Le Roux, J., Chen, Z., Watanabe, S., Hershey, J.R., "Single-Channel Multi-Speaker Separation using Deep Clustering", Interspeech, DOI: 10.21437/Interspeech.2016-1176, September 2016, pp. 545-549.
BibTeX TR2016-073 PDF
- @inproceedings{Isik2016sep,
-   author    = {Isik, Yusuf and {Le Roux}, Jonathan and Chen, Zhuo and Watanabe, Shinji and Hershey, John R.},
-   title     = {{Single-Channel Multi-Speaker Separation using Deep Clustering}},
-   booktitle = {Interspeech},
-   pages     = {545--549},
-   month     = sep,
-   year      = {2016},
-   doi       = {10.21437/Interspeech.2016-1176},
-   url       = {https://www.merl.com/publications/TR2016-073}
- }
Zmolikova, K., Karafiat, M., Vesely, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J.H., "Data selection by sequence summarizing neural network in mismatch condition training", Interspeech, DOI: 10.21437/Interspeech.2016-741, September 2016, pp. 2354-2358.
BibTeX TR2016-075 PDF
- @inproceedings{Zmolikova2016sep,
-   author    = {Zmolikova, Katerina and Karafiat, Martin and Vesely, Karel and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan Honza},
-   title     = {{Data selection by sequence summarizing neural network in mismatch condition training}},
-   booktitle = {Interspeech},
-   pages     = {2354--2358},
-   month     = sep,
-   year      = {2016},
-   doi       = {10.21437/Interspeech.2016-741},
-   url       = {https://www.merl.com/publications/TR2016-075}
- }
Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), September 2016, pp. 35-39.
BibTeX TR2016-114 PDF
- @inproceedings{Hayashi2016sep,
-   author    = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and {Le Roux}, Jonathan and Takeda, Kazuya},
-   title     = {{Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection}},
-   booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
-   pages     = {35--39},
-   month     = sep,
-   year      = {2016},
-   url       = {https://www.merl.com/publications/TR2016-114}
- }
Koike-Akino, T., Mahajan, R., Marks, T.K., Tuzel, C.O., Wang, Y., Watanabe, S., Orlik, P.V., "High-Accuracy User Identification Using EEG Biometrics", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/EMBC.2016.7590835, August 2016, pp. 854-858.
BibTeX TR2016-105 PDF Presentation
- @inproceedings{Koike-Akino2016aug,
-   author    = {Koike-Akino, Toshiaki and Mahajan, Ruhi and Marks, Tim K. and Tuzel, C. Oncel and Wang, Ye and Watanabe, Shinji and Orlik, Philip V.},
-   title     = {{High-Accuracy User Identification Using EEG Biometrics}},
-   booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
-   pages     = {854--858},
-   month     = aug,
-   year      = {2016},
-   doi       = {10.1109/EMBC.2016.7590835},
-   url       = {https://www.merl.com/publications/TR2016-105}
- }