Publications

193 / 3,738 publications found.


  •  Watanabe, S., Hori, T., Karita, S., Hayashi, T., Nishitoba, J., Unno, Y., Enrique Yalta Soplin, N., Heymann, J., Wiesner, M., Chen, N., Renduchintala, A., Ochiai, T., "ESPnet: End-to-End Speech Processing Toolkit", Interspeech, September 2018.
    BibTeX TR2018-136 PDF
    • @inproceedings{Watanabe2018sep,
    • author = {Watanabe, Shinji and Hori, Takaaki and Karita, Shigeki and Hayashi, Tomoki and Nishitoba, Jiro and Unno, Yuya and Enrique Yalta Soplin, Nelson and Heymann, Jahn and Wiesner, Matthew and Chen, Nanxin and Renduchintala, Adithya and Ochiai, Tsubasa},
    • title = {ESPnet: End-to-End Speech Processing Toolkit},
    • booktitle = {Interspeech},
    • year = 2018,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2018-136}
    • }
  •  Ataer-Cansizoglu, E., Jones, M.J., Zhang, Z., Sullivan, A., "Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network", arXiv, August 2018.
    BibTeX arXiv
    • @article{Ataer-Cansizoglu2018aug,
    • author = {Ataer-Cansizoglu, Esra and Jones, Michael J. and Zhang, Ziming and Sullivan, Alan},
    • title = {Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network},
    • journal = {arXiv},
    • year = 2018,
    • month = aug,
    • url = {https://arxiv.org/abs/1903.10974}
    • }
  •  Zhang, Z., "LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks", arXiv, July 12, 2018.
    BibTeX arXiv
    • @article{Zhang2018jul,
    • author = {Zhang, Ziming},
    • title = {LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks},
    • journal = {arXiv},
    • year = 2018,
    • month = jul,
    • url = {https://arxiv.org/abs/1805.08656}
    • }
  •  Pan, Y., Farahmand, A.-M., White, M., Nabi, S., Grover, P., Nikovski, D.N., "Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control", International Conference on Machine Learning (ICML), July 2018.
    BibTeX TR2018-101 PDF
    • @inproceedings{Pan2018jul,
    • author = {Pan, Yangchen and Farahmand, Amir-massoud and White, Martha and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
    • title = {Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2018,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2018-101}
    • }
  •  Barker, J., Marxer, R., Vincent, E., Watanabe, S., "The CHiME challenges: Robust speech recognition in everyday environments" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R., Eds., chapter 14, Springer, July 2018.
    BibTeX
    • @incollection{Barker2018jul,
    • author = {Barker, Jon and Marxer, Ricard and Vincent, Emmanuel and Watanabe, Shinji},
    • title = {The CHiME challenges: Robust speech recognition in everyday environments},
    • booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    • year = 2018,
    • editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
    • chapter = 14,
    • month = jul,
    • publisher = {Springer}
    • }
  •  Erdogan, H., Hershey, J., Watanabe, S., Le Roux, J., "Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R., Eds., chapter 7, Springer, July 2018.
    BibTeX
    • @incollection{Erdogan2018jul,
    • author = {Erdogan, Hakan and Hershey, John and Watanabe, Shinji and Le Roux, Jonathan},
    • title = {Deep recurrent networks for separation and recognition of single-channel speech in non-stationary background audio},
    • booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    • year = 2018,
    • editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
    • chapter = 7,
    • month = jul,
    • publisher = {Springer},
    • isbn = {978-3-319-64680-0}
    • }
  •  Hershey, J., Le Roux, J., Watanabe, S., Wisdom, S., Chen, Z., Isik, Y., "Novel deep architectures in speech processing" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R., Eds., chapter 6, Springer, July 9, 2018.
    BibTeX
    • @incollection{Hershey2018jul,
    • author = {Hershey, John and Le Roux, Jonathan and Watanabe, Shinji and Wisdom, Scott and Chen, Zhuo and Isik, Yusuf},
    • title = {Novel deep architectures in speech processing},
    • booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    • year = 2018,
    • editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
    • chapter = 6,
    • month = jul,
    • publisher = {Springer}
    • }
  •  Karafiat, M., Vesely, K., Zmolikova, K., Delcroix, M., Watanabe, S., Burget, L., Cernocky, J., Szoke, I., Novotny, O., "Training data augmentation and data selection" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R., Eds., chapter 10, Springer, July 9, 2018.
    BibTeX
    • @incollection{Karafiat2018jul,
    • author = {Karafiat, Martin and Vesely, Karel and Zmolikova, Katerina and Delcroix, Marc and Watanabe, Shinji and Burget, Lukas and Cernocky, Jan and Szoke, Igor and Novotny, Ondrej},
    • title = {Training data augmentation and data selection},
    • booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    • year = 2018,
    • editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
    • chapter = 10,
    • month = jul,
    • publisher = {Springer}
    • }
  •  Watanabe, S., Hori, T., Miao, Y., Delcroix, M., Metze, F., Hershey, J., "Toolkits for robust speech processing" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R., Eds., chapter 14, Springer, July 9, 2018.
    BibTeX
    • @incollection{Watanabe2018jul,
    • author = {Watanabe, Shinji and Hori, Takaaki and Miao, Yajie and Delcroix, Marc and Metze, Florian and Hershey, John},
    • title = {Toolkits for robust speech processing},
    • booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    • year = 2018,
    • editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
    • chapter = 14,
    • month = jul,
    • publisher = {Springer}
    • }
  •  Xiao, X., Watanabe, S., Erdogan, H., Mandel, M., Lu, L., Hershey, J., Seltzer, M., Chen, G., Zhang, Y., Yu, D., "Discriminative beamforming with phase aware neural networks for speech enhancement and recognition" in New Era for Robust Speech Recognition: Exploiting Deep Learning, Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R., Eds., chapter 4, Springer, July 9, 2018.
    BibTeX
    • @incollection{Xiao2018jul2,
    • author = {Xiao, Xiong and Watanabe, Shinji and Erdogan, Hakan and Mandel, Michael and Lu, Liang and Hershey, John and Seltzer, Mike and Chen, Guoguo and Zhang, Yu and Yu, Dong},
    • title = {Discriminative beamforming with phase aware neural networks for speech enhancement and recognition},
    • booktitle = {New Era for Robust Speech Recognition: Exploiting Deep Learning},
    • year = 2018,
    • editor = {Watanabe, S. and Delcroix, M. and Metze, F. and Hershey, J.R.},
    • chapter = 4,
    • month = jul,
    • publisher = {Springer}
    • }
  •  Liu, J., Guo, J., Orlik, P.V., Shibata, M., Nakahara, D., Mii, S., Takac, M., "Anomaly Detection in Manufacturing Systems Using Structured Neural Networks", IEEE World Congress on Intelligent Control and Automation, DOI: 10.1109/WCICA.2018.8630692, July 2018, pp. 175-180.
    BibTeX TR2018-097 PDF
    • @inproceedings{Liu2018jul2,
    • author = {Liu, Jie and Guo, Jianlin and Orlik, Philip V. and Shibata, Masahiko and Nakahara, Daiki and Mii, Satoshi and Takac, Martin},
    • title = {Anomaly Detection in Manufacturing Systems Using Structured Neural Networks},
    • booktitle = {IEEE World Congress on Intelligent Control and Automation},
    • year = 2018,
    • pages = {175--180},
    • month = jul,
    • doi = {10.1109/WCICA.2018.8630692},
    • url = {https://www.merl.com/publications/TR2018-097}
    • }
  •  Koike-Akino, T., Millar, D.S., Parsons, K., Kojima, K., "Fiber Nonlinearity Equalization with Multi-Label Deep Learning Scalable to High-Order DP-QAM", Signal Processing in Photonic Communications (SPPCom), DOI: 10.1364/SPPCOM.2018.SpM4G.1, July 2018.
    BibTeX TR2018-047 PDF
    • @inproceedings{Koike-Akino2018jul3,
    • author = {Koike-Akino, Toshiaki and Millar, David S. and Parsons, Kieran and Kojima, Keisuke},
    • title = {Fiber Nonlinearity Equalization with Multi-Label Deep Learning Scalable to High-Order DP-QAM},
    • booktitle = {Signal Processing in Photonic Communications (SPPCom)},
    • year = 2018,
    • month = jul,
    • doi = {10.1364/SPPCOM.2018.SpM4G.1},
    • url = {https://www.merl.com/publications/TR2018-047}
    • }
  •  Shen, Y., Feng, C., Yang, Y., Tian, D., "Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018.
    BibTeX TR2018-041 PDF Software
    • @inproceedings{Shen2018jun,
    • author = {Shen, Yiru and Feng, Chen and Yang, Yaoqing and Tian, Dong},
    • title = {Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2018,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2018-041}
    • }
  •  Yang, Y., Feng, C., Shen, Y., Tian, D., "FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2018.00029, June 2018.
    BibTeX TR2018-042 PDF Video Software
    • @inproceedings{Yang2018jun,
    • author = {Yang, Yaoqing and Feng, Chen and Shen, Yiru and Tian, Dong},
    • title = {FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2018,
    • month = jun,
    • doi = {10.1109/CVPR.2018.00029},
    • url = {https://www.merl.com/publications/TR2018-042}
    • }
  •  Zhang, Z., Wu, Y., Wang, G., "BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018, pp. 3301-3309.
    BibTeX TR2018-068 PDF
    • @inproceedings{Zhang2018jun,
    • author = {Zhang, Ziming and Wu, Yuanwei and Wang, Guanghui},
    • title = {BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2018,
    • pages = {3301--3309},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2018-068}
    • }
  •  Fujihashi, T., Koike-Akino, T., Watanabe, T., Orlik, P.V., "Nonlinear Equalization with Deep Learning for Multi-Purpose Visual MIMO Communications", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC.2018.8422544, May 2018.
    BibTeX TR2018-039 PDF
    • @inproceedings{Fujihashi2018may,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi and Orlik, Philip V.},
    • title = {Nonlinear Equalization with Deep Learning for Multi-Purpose Visual MIMO Communications},
    • booktitle = {IEEE International Conference on Communications (ICC)},
    • year = 2018,
    • month = may,
    • doi = {10.1109/ICC.2018.8422544},
    • url = {https://www.merl.com/publications/TR2018-039}
    • }
  •  Settle, S., Le Roux, J., Hori, T., Watanabe, S., Hershey, J.R., "End-to-End Multi-Speaker Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8461893, April 2018, pp. 4819-4823.
    BibTeX TR2018-001 PDF Video
    • @inproceedings{Settle2018apr,
    • author = {Settle, Shane and Le Roux, Jonathan and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
    • title = {End-to-End Multi-Speaker Speech Recognition},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2018,
    • pages = {4819--4823},
    • month = apr,
    • doi = {10.1109/ICASSP.2018.8461893},
    • url = {https://www.merl.com/publications/TR2018-001}
    • }
  •  Wen, B., Kamilov, U., Liu, D., Mansour, H., Boufounos, P.T., "DeepCASD: An End-to-End Approach for Multi-Spectral Image Super-Resolution", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8461795, April 2018, pp. 6503-6507.
    BibTeX TR2018-009 PDF
    • @inproceedings{Wen2018apr,
    • author = {Wen, Bihan and Kamilov, Ulugbek and Liu, Dehong and Mansour, Hassan and Boufounos, Petros T.},
    • title = {DeepCASD: An End-to-End Approach for Multi-Spectral Image Super-Resolution},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2018,
    • pages = {6503--6507},
    • month = apr,
    • doi = {10.1109/ICASSP.2018.8461795},
    • url = {https://www.merl.com/publications/TR2018-009}
    • }
  •  Zhang, Z., Xu, W., Sullivan, A., "Time-Delay Momentum: A Regularization Perspective on the Convergence and Generalization of Stochastic Momentum for Deep Learning", arXiv, March 2018.
    BibTeX arXiv
    • @article{Zhang2018mar,
    • author = {Zhang, Ziming and Xu, Wenju and Sullivan, Alan},
    • title = {Time-Delay Momentum: A Regularization Perspective on the Convergence and Generalization of Stochastic Momentum for Deep Learning},
    • journal = {arXiv},
    • year = 2018,
    • month = mar,
    • url = {https://arxiv.org/abs/1903.00760}
    • }
  •  Ochiai, T., Watanabe, S., Hori, T., Hershey, J.R., Xiao, X., "Unified Architecture for Multichannel End-to-End Speech Recognition with Neural Beamforming", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2017.2764276, Vol. 11, No. 8, pp. 1274-1288, October 2017.
    BibTeX TR2017-192 PDF
    • @article{Ochiai2017oct2,
    • author = {Ochiai, Tsubasa and Watanabe, Shinji and Hori, Takaaki and Hershey, John R. and Xiao, Xiong},
    • title = {Unified Architecture for Multichannel End-to-End Speech Recognition with Neural Beamforming},
    • journal = {IEEE Journal of Selected Topics in Signal Processing},
    • year = 2017,
    • volume = 11,
    • number = 8,
    • pages = {1274--1288},
    • month = oct,
    • doi = {10.1109/JSTSP.2017.2764276},
    • issn = {1941-0484},
    • url = {https://www.merl.com/publications/TR2017-192}
    • }
  •  Watanabe, S., Hori, T., Kim, S., Hershey, J.R., Hayashi, T., "Hybrid CTC/Attention Architecture for End-to-End Speech Recognition", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2017.2763455, Vol. 11, No. 8, pp. 1240-1253, October 2017.
    BibTeX TR2017-190 PDF Video
    • @article{Watanabe2017oct,
    • author = {Watanabe, Shinji and Hori, Takaaki and Kim, Suyoun and Hershey, John R. and Hayashi, Tomoki},
    • title = {Hybrid CTC/Attention Architecture for End-to-End Speech Recognition},
    • journal = {IEEE Journal of Selected Topics in Signal Processing},
    • year = 2017,
    • volume = 11,
    • number = 8,
    • pages = {1240--1253},
    • month = oct,
    • doi = {10.1109/JSTSP.2017.2763455},
    • issn = {1941-0484},
    • url = {https://www.merl.com/publications/TR2017-190}
    • }
  •  Hori, T., Watanabe, S., Zhang, Y., Chan, W., "Advances in Joint CTC-Attention based End-to-End Speech Recognition with a Deep CNN Encoder and RNN-LM", Interspeech, August 2017.
    BibTeX TR2017-132 PDF Video
    • @inproceedings{Hori2017aug,
    • author = {Hori, Takaaki and Watanabe, Shinji and Zhang, Yu and Chan, William},
    • title = {Advances in Joint CTC-Attention based End-to-End Speech Recognition with a Deep CNN Encoder and RNN-LM},
    • booktitle = {Interspeech},
    • year = 2017,
    • month = aug,
    • url = {https://www.merl.com/publications/TR2017-132}
    • }
  •  Abbeloos, W., Caccamo, S., Ataer-Cansizoglu, E., Taguchi, Y., Feng, C., Lee, T.-Y., "Detecting and Grouping Identical Objects for Region Proposal and Classification", CVPR Workshop on Deep Learning for Robotic Vision, DOI: 10.1109/CVPRW.2017.76, July 2017.
    BibTeX TR2017-099 PDF
    • @inproceedings{Abbeloos2017jul,
    • author = {Abbeloos, Wim and Caccamo, Sergio and Ataer-Cansizoglu, Esra and Taguchi, Yuichi and Feng, Chen and Lee, Teng-Yok},
    • title = {Detecting and Grouping Identical Objects for Region Proposal and Classification},
    • booktitle = {CVPR Workshop on Deep Learning for Robotic Vision},
    • year = 2017,
    • month = jul,
    • doi = {10.1109/CVPRW.2017.76},
    • url = {https://www.merl.com/publications/TR2017-099}
    • }
  •  Yu, Z., Feng, C., Liu, M.-Y., Ramalingam, S., "CASENet: Deep Category-Aware Semantic Edge Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2017.191, July 2017.
    BibTeX TR2017-100 PDF Video Data Software
    • @inproceedings{Yu2017jul,
    • author = {Yu, Zhiding and Feng, Chen and Liu, Ming-Yu and Ramalingam, Srikumar},
    • title = {CASENet: Deep Category-Aware Semantic Edge Detection},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2017,
    • month = jul,
    • doi = {10.1109/CVPR.2017.191},
    • url = {https://www.merl.com/publications/TR2017-100}
    • }
  •  Feng, C., Liu, M.-Y., Kao, C.-C., Lee, T.-Y., "Deep Active Learning for Civil Infrastructure Defect Detection and Classification", International Workshop on Computing in Civil Engineering (IWCCE), June 2017.
    BibTeX TR2017-034 PDF
    • @inproceedings{Feng2017jun,
    • author = {Feng, Chen and Liu, Ming-Yu and Kao, Chieh-Chi and Lee, Teng-Yok},
    • title = {Deep Active Learning for Civil Infrastructure Defect Detection and Classification},
    • booktitle = {International Workshop on Computing in Civil Engineering (IWCCE)},
    • year = 2017,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2017-034}
    • }