Publications

609 / 3,655 publications found.


  •  Meng, Z., Watanabe, S., Hershey, J.R., Erdogan, H., "Deep Long Short-Term Memory Adaptive Beamforming Networks for Multichannel Robust Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
    BibTeX TR2017-012 PDF
    • @inproceedings{Meng2017mar,
    • author = {Meng, Zhong and Watanabe, Shinji and Hershey, John R. and Erdogan, Hakan},
    • title = {Deep Long Short-Term Memory Adaptive Beamforming Networks for Multichannel Robust Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2017,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2017-012}
    • }
  •  Watanabe, S., Hori, T., Le Roux, J., Hershey, J.R., "Student-Teacher Network Learning with Enhanced Features", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2017.
    BibTeX TR2017-011 PDF
    • @inproceedings{Watanabe2017mar,
    • author = {Watanabe, Shinji and Hori, Takaaki and Le Roux, Jonathan and Hershey, John R.},
    • title = {Student-Teacher Network Learning with Enhanced Features},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2017,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2017-011}
    • }
  •  Hara, K., Liu, M.-Y., Tuzel, C.O., Farahmand, A.-M., "Attentional Network for Visual Object Detection", arXiv, January 2017.
    BibTeX arXiv
    • @article{Hara2017jan,
    • author = {Hara, Kota and Liu, Ming-Yu and Tuzel, C. Oncel and Farahmand, Amir-massoud},
    • title = {Attentional Network for Visual Object Detection},
    • journal = {arXiv},
    • year = 2017,
    • month = jan,
    • url = {https://arxiv.org/abs/1702.01478}
    • }
  •  Xiao, X., Watanabe, S., Chng, E.S., Li, H., "Beamforming Networks Using Spatial Covariance Features for Far-field Speech Recognition", Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC), DOI: 10.1109/APSIPA.2016.7820724, December 2016.
    BibTeX TR2016-162 PDF
    • @inproceedings{Xiao2016dec,
    • author = {Xiao, Xiong and Watanabe, Shinji and Chng, Eng Siong and Li, Haizhou},
    • title = {Beamforming Networks Using Spatial Covariance Features for Far-field Speech Recognition},
    • booktitle = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
    • year = 2016,
    • month = dec,
    • doi = {10.1109/APSIPA.2016.7820724},
    • url = {https://www.merl.com/publications/TR2016-162}
    • }
  •  Hori, T., Wang, H., Hori, C., Watanabe, S., Harsham, B.A., Le Roux, J., Hershey, J.R., Koji, Y., Jing, Y., Zhu, Z., Aikawa, T., "Dialog State Tracking with Attention-based Sequence-to-sequence Learning", IEEE Workshop on Spoken Language Technology (SLT), DOI: 10.1109/​SLT.2016.7846317, December 2016, pp. 552-558.
    BibTeX TR2016-163 PDF
    • @inproceedings{Hori2016dec,
    • author = {Hori, Takaaki and Wang, Hai and Hori, Chiori and Watanabe, Shinji and Harsham, Bret A. and Le Roux, Jonathan and Hershey, John R. and Koji, Yusuke and Jing, Yi and Zhu, Zhaocheng and Aikawa, Takeyuki},
    • title = {Dialog State Tracking with Attention-based Sequence-to-sequence Learning},
    • booktitle = {IEEE Workshop on Spoken Language Technology (SLT)},
    • year = 2016,
    • pages = {552--558},
    • month = dec,
    • doi = {10.1109/SLT.2016.7846317},
    • url = {https://www.merl.com/publications/TR2016-163}
    • }
  •  Farahmand, A.-M., Nabi, S., Grover, P., Nikovski, D.N., "Learning to Control Partial Differential Equations: Regularized Fitted Q-Iteration Approach", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/​CDC.2016.7798966, December 2016, pp. 4578-4585.
    BibTeX TR2016-145 PDF
    • @inproceedings{Farahmand2016dec,
    • author = {Farahmand, Amir-massoud and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
    • title = {Learning to Control Partial Differential Equations: Regularized Fitted Q-Iteration Approach},
    • booktitle = {IEEE Conference on Decision and Control (CDC)},
    • year = 2016,
    • pages = {4578--4585},
    • month = dec,
    • doi = {10.1109/CDC.2016.7798966},
    • url = {https://www.merl.com/publications/TR2016-145}
    • }
  •  Takano, T., Moriya, T., Shinozaki, T., Watanabe, S., Hori, T., Duh, K., "Automated Structure Discovery and Parameter Tuning of Neural Network Language Model Based on Evolution Strategy", IEEE Spoken Language Technology Workshop (SLT), DOI: 10.1109/​SLT.2016.7846334, December 2016.
    BibTeX TR2016-173 PDF
    • @inproceedings{Takano2016dec,
    • author = {Takano, Tomihiro and Moriya, Takafumi and Shinozaki, Takahiro and Watanabe, Shinji and Hori, Takaaki and Duh, Kevin},
    • title = {Automated Structure Discovery and Parameter Tuning of Neural Network Language Model Based on Evolution Strategy},
    • booktitle = {IEEE Spoken Language Technology Workshop (SLT)},
    • year = 2016,
    • month = dec,
    • doi = {10.1109/SLT.2016.7846334},
    • url = {https://www.merl.com/publications/TR2016-173}
    • }
  •  Laftchiev, E., Nikovski, D.N., "An IoT System to Estimate Personal Thermal Comfort", IEEE World Forum on Internet of Things (WF-IoT), DOI: 10.1109/WF-IoT.2016.7845401, December 2016, pp. 672-677.
    BibTeX TR2016-161 PDF
    • @inproceedings{Laftchiev2016dec,
    • author = {Laftchiev, Emil and Nikovski, Daniel N.},
    • title = {An IoT System to Estimate Personal Thermal Comfort},
    • booktitle = {IEEE World Forum on Internet of Things (WF-IoT)},
    • year = 2016,
    • pages = {672--677},
    • month = dec,
    • doi = {10.1109/WF-IoT.2016.7845401},
    • url = {https://www.merl.com/publications/TR2016-161}
    • }
  •  Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The Third 'CHIME' Speech Separation and Recognition Challenge: Analysis and Outcomes", Computer Speech & Language, DOI: 10.1016/​j.csl.2016.10.005, December 2016.
    BibTeX TR2016-171 PDF
    • @article{Barker2016dec,
    • author = {Barker, Jon and Marxer, Ricard and Vincent, Emmanuel and Watanabe, Shinji},
    • title = {The Third 'CHIME' Speech Separation and Recognition Challenge: Analysis and Outcomes},
    • journal = {Computer Speech \& Language},
    • year = 2016,
    • month = dec,
    • publisher = {Elsevier},
    • doi = {10.1016/j.csl.2016.10.005},
    • url = {https://www.merl.com/publications/TR2016-171}
    • }
  •  Liu, M.-Y., Tuzel, C.O., Sullivan, A., "Coupled Generative Adversarial Nets", Advances in Neural Information Processing Systems (NIPS), December 2016.
    BibTeX TR2016-156 PDF
    • @inproceedings{Liu2016dec,
    • author = {Liu, Ming-Yu and Tuzel, C. Oncel and Sullivan, Alan},
    • title = {Coupled Generative Adversarial Nets},
    • booktitle = {Advances in Neural Information Processing Systems (NIPS)},
    • year = 2016,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2016-156}
    • }
  •  Wisdom, S., Powers, T., Hershey, J.R., Le Roux, J., Atlas, L., "Full-Capacity Unitary Recurrent Neural Networks", Advances in Neural Information Processing Systems (NIPS), December 2016.
    BibTeX TR2016-155 PDF
    • @inproceedings{Wisdom2016dec,
    • author = {Wisdom, Scott and Powers, Thomas and Hershey, John R. and Le Roux, Jonathan and Atlas, Les},
    • title = {Full-Capacity Unitary Recurrent Neural Networks},
    • booktitle = {Advances in Neural Information Processing Systems (NIPS)},
    • year = 2016,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2016-155}
    • }
  •  Vincent, E., Watanabe, S., Nugraha, A.A., Barker, J., Marxer, R., "An analysis of environment, microphone and data simulation mismatches in robust speech recognition", Computer Speech & Language, DOI: 10.1016/​j.csl.2016.11.005, December 2016.
    BibTeX TR2016-172 PDF
    • @article{Vincent2016dec,
    • author = {Vincent, Emmanuel and Watanabe, Shinji and Nugraha, Aditya Arie and Barker, Jon and Marxer, Ricard},
    • title = {An analysis of environment, microphone and data simulation mismatches in robust speech recognition},
    • journal = {Computer Speech \& Language},
    • year = 2016,
    • month = dec,
    • publisher = {Elsevier},
    • doi = {10.1016/j.csl.2016.11.005},
    • url = {https://www.merl.com/publications/TR2016-172}
    • }
  •  Chen, C., Liu, M.-Y., Tuzel, C.O., Xiao, J., "R-CNN for Small Object Detection", Asian Conference on Computer Vision (ACCV), DOI: 10.1007/​978-3-319-54193-8_14, November 2016, vol. 10115, pp. 214-230.
    BibTeX TR2016-144 PDF
    • @inproceedings{Chen2016nov,
    • author = {Chen, Chenyi and Liu, Ming-Yu and Tuzel, C. Oncel and Xiao, Jianxiong},
    • title = {R-CNN for Small Object Detection},
    • booktitle = {Asian Conference on Computer Vision (ACCV)},
    • year = 2016,
    • volume = 10115,
    • pages = {214--230},
    • month = nov,
    • doi = {10.1007/978-3-319-54193-8_14},
    • url = {https://www.merl.com/publications/TR2016-144}
    • }
  •  Tawara, N., Ogawa, T., Watanabe, S., Kobayashi, T., "Nested Gibbs sampling for mixture-of-mixture model and its application to speaker clustering", APSIPA Transactions on Signal and Information Processing, DOI: 10.1017/​ATSIP.2016.15, Vol. 5, October 2016.
    BibTeX TR2016-138 PDF
    • @article{Tawara2016oct,
    • author = {Tawara, Naohiro and Ogawa, Tetsuji and Watanabe, Shinji and Kobayashi, Tetsunori},
    • title = {Nested Gibbs sampling for mixture-of-mixture model and its application to speaker clustering},
    • journal = {APSIPA Transactions on Signal and Information Processing},
    • year = 2016,
    • volume = 5,
    • month = oct,
    • doi = {10.1017/ATSIP.2016.15},
    • url = {https://www.merl.com/publications/TR2016-138}
    • }
  •  Ozcan, G., Pajovic, M., Sahinoglu, Z., Wang, Y., Orlik, P.V., Wada, T., "Online State of Charge Estimation for Lithium-Ion Batteries Using Gaussian Process Regression", IEEE Industrial Electronics Society (IECON), DOI: 10.1109/​IECON.2016.7793002, October 2016, pp. 998-1003.
    BibTeX TR2016-136 PDF
    • @inproceedings{Ozcan2016oct,
    • author = {Ozcan, Gozde and Pajovic, Milutin and Sahinoglu, Zafer and Wang, Yebin and Orlik, Philip V. and Wada, Toshihiro},
    • title = {Online State of Charge Estimation for Lithium-Ion Batteries Using Gaussian Process Regression},
    • booktitle = {IEEE Industrial Electronics Society (IECON)},
    • year = 2016,
    • pages = {998--1003},
    • month = oct,
    • doi = {10.1109/IECON.2016.7793002},
    • url = {https://www.merl.com/publications/TR2016-136}
    • }
  •  Tuzel, C.O., Marks, T.K., Tambe, S., "Robust Face Alignment Using a Mixture of Invariant Experts", European Conference on Computer Vision (ECCV), DOI: 10.1007/​978-3-319-46454-1_50, October 2016, vol. 9909, pp. 825-841.
    BibTeX TR2016-129 PDF
    • @inproceedings{Tuzel2016oct,
    • author = {Tuzel, C. Oncel and Marks, Tim K. and Tambe, Salil},
    • title = {Robust Face Alignment Using a Mixture of Invariant Experts},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2016,
    • volume = 9909,
    • pages = {825--841},
    • month = oct,
    • doi = {10.1007/978-3-319-46454-1_50},
    • url = {https://www.merl.com/publications/TR2016-129}
    • }
  •  Sankaran, B., Ramalingam, S., Taguchi, Y., "Parameter Learning for Improving Binary Descriptor Matching", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/​IROS.2016.7759718, October 2016, pp. 4892-4897.
    BibTeX TR2016-132 PDF
    • @inproceedings{Sankaran2016oct,
    • author = {Sankaran, Bharath and Ramalingam, Srikumar and Taguchi, Yuichi},
    • title = {Parameter Learning for Improving Binary Descriptor Matching},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2016,
    • pages = {4892--4897},
    • month = oct,
    • doi = {10.1109/IROS.2016.7759718},
    • url = {https://www.merl.com/publications/TR2016-132}
    • }
  •  Delcroix, M., Watanabe, S., "Recent Advances in Distant Speech Recognition," Tech. Rep. TR2016-115, Interspeech Tutorials, September 2016.
    BibTeX TR2016-115 PDF
    • @techreport{Delcroix2016sep,
    • author = {Delcroix, Marc and Watanabe, Shinji},
    • title = {Recent Advances in Distant Speech Recognition},
    • booktitle = {Interspeech Tutorials},
    • institution = {Interspeech},
    • number = {TR2016-115},
    • year = 2016,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-115}
    • }
  •  Le Roux, J., Vincent, E., Erdogan, H., "Learning-Based Approaches to Speech Enhancement and Separation," Tech. Rep. TR2016-113, Interspeech Tutorials, September 2016.
    BibTeX TR2016-113 PDF
    • @techreport{LeRoux2016sep,
    • author = {Le Roux, Jonathan and Vincent, Emmanuel and Erdogan, Hakan},
    • title = {Learning-Based Approaches to Speech Enhancement and Separation},
    • booktitle = {Interspeech Tutorials},
    • institution = {Interspeech},
    • number = {TR2016-113},
    • year = 2016,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-113}
    • }
  •  Erdogan, H., Hershey, J.R., Watanabe, S., Mandel, M., Le Roux, J., "Improved MVDR beamforming using single-channel mask prediction networks", Interspeech, DOI: 10.21437/​Interspeech.2016-552, September 2016, pp. 1981-1985.
    BibTeX TR2016-072 PDF
    • @inproceedings{Erdogan2016sep,
    • author = {Erdogan, Hakan and Hershey, John R. and Watanabe, Shinji and Mandel, Michael and Le Roux, Jonathan},
    • title = {Improved MVDR beamforming using single-channel mask prediction networks},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {1981--1985},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-552},
    • url = {https://www.merl.com/publications/TR2016-072}
    • }
  •  Hori, C., Hori, T., Watanabe, S., Hershey, J.R., "Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs", Interspeech, DOI: 10.21437/​Interspeech.2016-1171, September 2016, pp. 3236-3240.
    BibTeX TR2016-074 PDF
    • @inproceedings{Hori2016sep,
    • author = {Hori, Chiori and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
    • title = {Context-Sensitive and Role-Dependent Spoken Language Understanding using Bidirectional and Attention LSTMs},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {3236--3240},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-1171},
    • url = {https://www.merl.com/publications/TR2016-074}
    • }
  •  Isik, Y., Le Roux, J., Chen, Z., Watanabe, S., Hershey, J.R., "Single-Channel Multi-Speaker Separation using Deep Clustering", Interspeech, DOI: 10.21437/​Interspeech.2016-1176, September 2016, pp. 545-549.
    BibTeX TR2016-073 PDF
    • @inproceedings{Isik2016sep,
    • author = {Isik, Yusuf and Le Roux, Jonathan and Chen, Zhuo and Watanabe, Shinji and Hershey, John R.},
    • title = {Single-Channel Multi-Speaker Separation using Deep Clustering},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {545--549},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-1176},
    • url = {https://www.merl.com/publications/TR2016-073}
    • }
  •  Zmolikova, K., Karafiat, M., Vesely, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J.H., "Data selection by sequence summarizing neural network in mismatch condition training", Interspeech, DOI: 10.21437/​Interspeech.2016-741, September 2016, pp. 2354-2358.
    BibTeX TR2016-075 PDF
    • @inproceedings{Zmolikova2016sep,
    • author = {Zmolikova, Katerina and Karafiat, Martin and Vesely, Karel and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan Honza},
    • title = {Data selection by sequence summarizing neural network in mismatch condition training},
    • booktitle = {Interspeech},
    • year = 2016,
    • pages = {2354--2358},
    • month = sep,
    • doi = {10.21437/Interspeech.2016-741},
    • url = {https://www.merl.com/publications/TR2016-075}
    • }
  •  Hayashi, T., Watanabe, S., Toda, T., Hori, T., Le Roux, J., Takeda, K., "Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection", Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE), September 2016, pp. 35-39.
    BibTeX TR2016-114 PDF
    • @inproceedings{Hayashi2016sep,
    • author = {Hayashi, Tomoki and Watanabe, Shinji and Toda, Tomoki and Hori, Takaaki and Le Roux, Jonathan and Takeda, Kazuya},
    • title = {Bidirectional LSTM-HMM Hybrid System for Polyphonic Sound Event Detection},
    • booktitle = {Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)},
    • year = 2016,
    • pages = {35--39},
    • month = sep,
    • url = {https://www.merl.com/publications/TR2016-114}
    • }
  •  Koike-Akino, T., Mahajan, R., Marks, T.K., Tuzel, C.O., Wang, Y., Watanabe, S., Orlik, P.V., "High-Accuracy User Identification Using EEG Biometrics", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/​EMBC.2016.7590835, August 2016, pp. 854-858.
    BibTeX TR2016-105 PDF Presentation
    • @inproceedings{Koike-Akino2016aug,
    • author = {Koike-Akino, Toshiaki and Mahajan, Ruhi and Marks, Tim K. and Tuzel, C. Oncel and Wang, Ye and Watanabe, Shinji and Orlik, Philip V.},
    • title = {High-Accuracy User Identification Using EEG Biometrics},
    • booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
    • year = 2016,
    • pages = {854--858},
    • month = aug,
    • doi = {10.1109/EMBC.2016.7590835},
    • url = {https://www.merl.com/publications/TR2016-105}
    • }