Publications

629 / 3,738 publications found.


  •  Karita, S., Chen, N., Hayashi, T., Hori, T., Inaguma, H., Jiang, Z., Someki, M., Enrique Yalta Soplin, N., Yamamoto, R., Wang, X., Watanabe, S., Yoshimura, T., Zhang, W., "A Comparative Study on Transformer Vs RNN in Speech Applications", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/​ASRU46091.2019.9003750, December 2019, pp. 449-456.
    BibTeX TR2019-158 PDF
    • @inproceedings{Karita2019dec,
    • author = {Karita, Shigeki and Chen, Nanxin and Hayashi, Tomoki and Hori, Takaaki and Inaguma, Hirofumi and Jiang, Ziyan and Someki, Masao and Yalta Soplin, Nelson Enrique and Yamamoto, Ryuichi and Wang, Xiaofei and Watanabe, Shinji and Yoshimura, Takenori and Zhang, Wangyou},
    • title = {A Comparative Study on Transformer Vs RNN in Speech Applications},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2019,
    • pages = {449--456},
    • month = dec,
    • doi = {10.1109/ASRU46091.2019.9003750},
    • url = {https://www.merl.com/publications/TR2019-158}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Streaming End-to-End Speech Recognition with Joint CTC-Attention Based Models", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2019, pp. 936-943.
    BibTeX TR2019-159 PDF
    • @inproceedings{Moritz2019dec,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Streaming End-to-End Speech Recognition with Joint CTC-Attention Based Models},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2019,
    • pages = {936--943},
    • month = dec,
    • isbn = {978-1-7281-0305-1},
    • url = {https://www.merl.com/publications/TR2019-159}
    • }
  •  Fujihashi, T., Koike-Akino, T., Watanabe, T., Orlik, P.V., "DNN-based Simultaneous Screen-to-Camera and Screen-to-Eye Communications", IEEE Global Communications Conference (GLOBECOM), DOI: 10.1109/​GLOBECOM38437.2019.9013967, December 2019.
    BibTeX TR2019-132 PDF
    • @inproceedings{Fujihashi2019dec,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi and Orlik, Philip V.},
    • title = {DNN-based Simultaneous Screen-to-Camera and Screen-to-Eye Communications},
    • booktitle = {IEEE Global Communications Conference (GLOBECOM)},
    • year = 2019,
    • month = dec,
    • publisher = {IEEE},
    • doi = {10.1109/GLOBECOM38437.2019.9013967},
    • issn = {2576-6813},
    • isbn = {978-1-7281-0962-6},
    • url = {https://www.merl.com/publications/TR2019-132}
    • }
  •  Jespersen, M.H., Pajovic, M., Koike-Akino, T., Wang, Y., Popovski, P., Orlik, P.V., "Deep Learning for Synchronization and Channel Estimation in NB-IoT Random Access Channel", IEEE Global Communications Conference (GLOBECOM), DOI: 10.1109/​GLOBECOM38437.2019.9013510, December 2019.
    BibTeX TR2019-140 PDF
    • @inproceedings{Jespersen2019dec,
    • author = {Jespersen, Mads Helge and Pajovic, Milutin and Koike-Akino, Toshiaki and Wang, Ye and Popovski, Petar and Orlik, Philip V.},
    • title = {Deep Learning for Synchronization and Channel Estimation in NB-IoT Random Access Channel},
    • booktitle = {IEEE Global Communications Conference (GLOBECOM)},
    • year = 2019,
    • month = dec,
    • publisher = {IEEE},
    • doi = {10.1109/GLOBECOM38437.2019.9013510},
    • issn = {2576-6813},
    • isbn = {978-1-7281-0962-6},
    • url = {https://www.merl.com/publications/TR2019-140}
    • }
  •  Jha, D.K., Raghunathan, A., Romeres, D., "QNTRPO: Including Curvature in TRPO", Optimization Foundations for Reinforcement Learning Workshop at NeurIPS, December 2019.
    BibTeX TR2019-154 PDF Software
    • @inproceedings{Jha2019dec,
    • author = {Jha, Devesh K. and Raghunathan, Arvind and Romeres, Diego},
    • title = {QNTRPO: Including Curvature in TRPO},
    • booktitle = {Optimization Foundations for Reinforcement Learning Workshop at NeurIPS},
    • year = 2019,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2019-154}
    • }
  •  Bhamidipati, S., Kim, K.J., Sun, H., Orlik, P.V., Zhang, J., "Joint BP and RNN for Resilient GPS Timing Against Spoofing Attacks" in Social Informatics and Telecommunications Engineering, Han S. and Ye L. and Meng W., Eds., DOI: 10.1007/​978-3-030-22971-9_17, vol. 287 of Lecture Notes of the Institute for Computer Sciences, Springer, Cham, November 2019.
    BibTeX TR2019-131 PDF
    • @incollection{Bhamidipati2019nov,
    • author = {Bhamidipati, Sriramya and Kim, Kyeong Jin and Sun, Hongbo and Orlik, Philip V. and Zhang, Jinyun},
    • title = {Joint BP and RNN for Resilient GPS Timing Against Spoofing Attacks},
    • booktitle = {Artificial Intelligence for Communications and Networks},
    • year = 2019,
    • editor = {Han, Shuai and Ye, Liang and Meng, Weixiao},
    • volume = 287,
    • series = {Lecture Notes of the Institute for Computer Sciences, Social Informatics and Telecommunications Engineering},
    • month = nov,
    • publisher = {Springer},
    • address = {Cham},
    • doi = {10.1007/978-3-030-22971-9_17},
    • url = {https://www.merl.com/publications/TR2019-131}
    • }
  •  Jha, D.K., Raghunathan, A., Romeres, D., "Quasi-Newton Trust Region Policy Optimization", Conference on Robot Learning (CoRL), Leslie Pack Kaelbling and Danica Kragic and Komei Sugiura, Eds., October 2019, pp. 945-954.
    BibTeX TR2019-120 PDF Software
    • @inproceedings{Jha2019oct,
    • author = {Jha, Devesh K. and Raghunathan, Arvind and Romeres, Diego},
    • title = {Quasi-Newton Trust Region Policy Optimization},
    • booktitle = {Conference on Robot Learning (CoRL)},
    • year = 2019,
    • editor = {Leslie Pack Kaelbling and Danica Kragic and Komei Sugiura},
    • pages = {945--954},
    • month = oct,
    • series = {Proceedings of Machine Learning Research},
    • publisher = {PMLR},
    • url = {https://www.merl.com/publications/TR2019-120}
    • }
  •  Zhang, Z., Wu, Y., Wang, G., "Unsupervised Deep Feature Transfer for Low Resolution Image Classification", IEEE International Conference on Computer Vision Workshops (ICCV), DOI: 10.1109/​ICCVW.2019.00136, October 2019, pp. 1065-1069.
    BibTeX TR2019-127 PDF
    • @inproceedings{Zhang2019oct,
    • author = {Zhang, Ziming and Wu, Yuanwei and Wang, Guanghui},
    • title = {Unsupervised Deep Feature Transfer for Low Resolution Image Classification},
    • booktitle = {IEEE International Conference on Computer Vision Workshops (ICCVW)},
    • year = 2019,
    • pages = {1065--1069},
    • month = oct,
    • doi = {10.1109/ICCVW.2019.00136},
    • url = {https://www.merl.com/publications/TR2019-127}
    • }
  •  Wang, J., Cherian, A., "GODS: Generalized One-class Discriminative Subspaces for Anomaly Detection", IEEE International Conference on Computer Vision (ICCV), DOI: 10.1109/​ICCV.2019.00829, October 2019, pp. 8200-8210.
    BibTeX TR2019-121 PDF
    • @inproceedings{Wang2019oct2,
    • author = {Wang, Jue and Cherian, Anoop},
    • title = {GODS: Generalized One-class Discriminative Subspaces for Anomaly Detection},
    • booktitle = {2019 IEEE/CVF International Conference on Computer Vision (ICCV)},
    • year = 2019,
    • pages = {8200--8210},
    • month = oct,
    • publisher = {IEEE},
    • doi = {10.1109/ICCV.2019.00829},
    • url = {https://www.merl.com/publications/TR2019-121}
    • }
  •  Kavalerov, I., Wisdom, S., Erdogan, H., Patton, B., Wilson, K., Le Roux, J., Hershey, J., "Universal Sound Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/​WASPAA.2019.8937253, October 2019, pp. 170-174.
    BibTeX TR2019-123 PDF
    • @inproceedings{Kavalerov2019oct,
    • author = {Kavalerov, Ilya and Wisdom, Scott and Erdogan, Hakan and Patton, Brian and Wilson, Kevin and Le Roux, Jonathan and Hershey, John},
    • title = {Universal Sound Separation},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2019,
    • pages = {170--174},
    • month = oct,
    • doi = {10.1109/WASPAA.2019.8937253},
    • issn = {1947-1629},
    • isbn = {978-1-7281-1123-0},
    • url = {https://www.merl.com/publications/TR2019-123}
    • }
  •  Manilow, E., Wichern, G., Seetharaman, P., Le Roux, J., "Cutting Music Source Separation Some Slakh: A Dataset to Study the Impact of Training Data Quality and Quantity", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/​WASPAA.2019.8937170, October 2019, pp. 45-49.
    BibTeX TR2019-124 PDF
    • @inproceedings{Manilow2019oct,
    • author = {Manilow, Ethan and Wichern, Gordon and Seetharaman, Prem and Le Roux, Jonathan},
    • title = {Cutting Music Source Separation Some Slakh: A Dataset to Study the Impact of Training Data Quality and Quantity},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • year = 2019,
    • pages = {45--49},
    • month = oct,
    • doi = {10.1109/WASPAA.2019.8937170},
    • issn = {1947-1629},
    • isbn = {978-1-7281-1123-0},
    • url = {https://www.merl.com/publications/TR2019-124}
    • }
  •  Koike-Akino, T., Wang, Y., Millar, D.S., Kojima, K., Parsons, K., "Neural Turbo Equalization to Mitigate Fiber Nonlinearity", European Conference on Optical Communication (ECOC), DOI: 10.1049/​cp.2019.0803, September 2019.
    BibTeX TR2019-088 PDF Presentation
    • @inproceedings{Koike-Akino2019sep,
    • author = {Koike-Akino, Toshiaki and Wang, Ye and Millar, David S. and Kojima, Keisuke and Parsons, Kieran},
    • title = {Neural Turbo Equalization to Mitigate Fiber Nonlinearity},
    • booktitle = {European Conference on Optical Communication (ECOC)},
    • year = 2019,
    • month = sep,
    • publisher = {IET},
    • doi = {10.1049/cp.2019.0803},
    • isbn = {978-1-83953-185-9},
    • url = {https://www.merl.com/publications/TR2019-088}
    • }
  •  Baskar, M.K., Watanabe, S., Astudillo, R., Hori, T., Burget, L., Cernocky, J.H., "Semi-supervised Sequence-to-sequence ASR using Unpaired Speech and Text", Interspeech, DOI: 10.21437/​Interspeech.2019-3167, September 2019, pp. 3790-3794.
    BibTeX TR2019-100 PDF
    • @inproceedings{Baskar2019sep,
    • author = {Baskar, Murali Karthick and Watanabe, Shinji and Astudillo, Ramon and Hori, Takaaki and Burget, Lukas and Cernocky, Jan Honza},
    • title = {Semi-supervised Sequence-to-sequence ASR using Unpaired Speech and Text},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {3790--3794},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-3167},
    • issn = {1990-9772},
    • url = {https://www.merl.com/publications/TR2019-100}
    • }
  •  Hori, C., Cherian, A., Marks, T.K., Hori, T., "Joint Student-Teacher Learning for Audio-Visual Scene-Aware Dialog", Interspeech, September 2019, pp. 1886-1890.
    BibTeX TR2019-097 PDF
    • @inproceedings{Hori2019sep,
    • author = {Hori, Chiori and Cherian, Anoop and Marks, Tim K. and Hori, Takaaki},
    • title = {Joint Student-Teacher Learning for Audio-Visual Scene-Aware Dialog},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {1886--1890},
    • month = sep,
    • publisher = {ISCA},
    • url = {https://www.merl.com/publications/TR2019-097}
    • }
  •  Karafiat, M., Baskar, M.K., Watanabe, S., Hori, T., Wiesner, M., Cernocky, J.H., "Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems", Interspeech, DOI: 10.21437/​Interspeech.2019-2355, September 2019, pp. 2220-2224.
    BibTeX TR2019-103 PDF
    • @inproceedings{Karafiat2019sep,
    • author = {Karafiat, Martin and Baskar, Murali Karthick and Watanabe, Shinji and Hori, Takaaki and Wiesner, Matthew and Cernocky, Jan Honza},
    • title = {Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {2220--2224},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-2355},
    • url = {https://www.merl.com/publications/TR2019-103}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Unidirectional Neural Network Architectures for End-to-End Automatic Speech Recognition", Interspeech, DOI: 10.21437/​Interspeech.2019-2837, September 2019, pp. 76-80.
    BibTeX TR2019-098 PDF
    • @inproceedings{Moritz2019sep,
    • author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Unidirectional Neural Network Architectures for End-to-End Automatic Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {76--80},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-2837},
    • url = {https://www.merl.com/publications/TR2019-098}
    • }
  •  Seki, H., Hori, T., Watanabe, S., Le Roux, J., Hershey, J., "End-to-End Multilingual Multi-Speaker Speech Recognition", Interspeech, DOI: 10.21437/​Interspeech.2019-3038, September 2019, pp. 3755-3759.
    BibTeX TR2019-101 PDF
    • @inproceedings{Seki2019sep,
    • author = {Seki, Hiroshi and Hori, Takaaki and Watanabe, Shinji and Le Roux, Jonathan and Hershey, John},
    • title = {End-to-End Multilingual Multi-Speaker Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {3755--3759},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-3038},
    • url = {https://www.merl.com/publications/TR2019-101}
    • }
  •  Seki, H., Hori, T., Watanabe, S., Moritz, N., Le Roux, J., "Vectorized Beam Search for CTC-Attention-based Speech Recognition", Interspeech, DOI: 10.21437/​Interspeech.2019-2860, September 2019, pp. 3825-3829.
    BibTeX TR2019-102 PDF
    • @inproceedings{Seki2019sep2,
    • author = {Seki, Hiroshi and Hori, Takaaki and Watanabe, Shinji and Moritz, Niko and Le Roux, Jonathan},
    • title = {Vectorized Beam Search for CTC-Attention-based Speech Recognition},
    • booktitle = {Interspeech},
    • year = 2019,
    • pages = {3825--3829},
    • month = sep,
    • doi = {10.21437/Interspeech.2019-2860},
    • url = {https://www.merl.com/publications/TR2019-102}
    • }
  •  Zhang, Z., Lin, Z., Pfister, H., "White-Box Adversarial Defense via Self-Supervised Data Estimation", arXiv, September 2019.
    BibTeX arXiv Software
    • @article{Zhang2019sep,
    • author = {Zhang, Ziming and Lin, Zudi and Pfister, Hanspeter},
    • title = {White-Box Adversarial Defense via Self-Supervised Data Estimation},
    • journal = {arXiv},
    • eprint = {1909.06271},
    • archiveprefix = {arXiv},
    • year = 2019,
    • month = sep,
    • url = {https://arxiv.org/abs/1909.06271}
    • }
  •  Jones, M.J., Rambhatla, S., "Body Part Alignment and Temporal Attention for Video-Based Person Re-Identification", British Machine Vision Conference (BMVC), September 2019.
    BibTeX TR2019-108 PDF
    • @inproceedings{Jones2019sep,
    • author = {Jones, Michael J. and Rambhatla, Sai},
    • title = {Body Part Alignment and Temporal Attention for Video-Based Person Re-Identification},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2019,
    • month = sep,
    • url = {https://www.merl.com/publications/TR2019-108}
    • }
  •  Yalta, N., Watanabe, S., Hori, T., Nakadai, K., Ogata, T., "CNN-based Multichannel End-to-End Speech Recognition for Everyday Home Environments", European Signal Processing Conference (EUSIPCO), DOI: 10.23919/​EUSIPCO.2019.8902524, September 2019, pp. 1-5.
    BibTeX TR2019-094 PDF
    • @inproceedings{Yalta2019sep,
    • author = {Yalta, Nelson and Watanabe, Shinji and Hori, Takaaki and Nakadai, Kazuhiro and Ogata, Tetsuya},
    • title = {CNN-based Multichannel End-to-End Speech Recognition for Everyday Home Environments},
    • booktitle = {European Signal Processing Conference (EUSIPCO)},
    • year = 2019,
    • pages = {1--5},
    • month = sep,
    • doi = {10.23919/EUSIPCO.2019.8902524},
    • url = {https://www.merl.com/publications/TR2019-094}
    • }
  •  Wang, J., Cherian, A., "Discriminative Video Representation Learning Using Support Vector Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/​TPAMI.2019.2937292, August 2019.
    BibTeX TR2019-107 PDF
    • @article{Wang2019aug,
    • author = {Wang, Jue and Cherian, Anoop},
    • title = {Discriminative Video Representation Learning Using Support Vector Classifiers},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2019,
    • month = aug,
    • doi = {10.1109/TPAMI.2019.2937292},
    • url = {https://www.merl.com/publications/TR2019-107}
    • }
  •  Romeres, D., Jha, D.K., Dau, H., Yerazunis, W.S., Nikovski, D.N., "Anomaly Detection for Insertion Tasks in Robotic Assembly Using Gaussian Process Models", European Control Conference (ECC), DOI: 10.23919/​ECC.2019.8795698, June 2019, pp. 1017-1022.
    BibTeX TR2019-055 PDF
    • @inproceedings{Romeres2019jun,
    • author = {Romeres, Diego and Jha, Devesh K. and Dau, Hoang and Yerazunis, William S. and Nikovski, Daniel N.},
    • title = {Anomaly Detection for Insertion Tasks in Robotic Assembly Using Gaussian Process Models},
    • booktitle = {European Control Conference (ECC)},
    • year = 2019,
    • pages = {1017--1022},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.23919/ECC.2019.8795698},
    • isbn = {978-3-907144-00-8},
    • url = {https://www.merl.com/publications/TR2019-055}
    • }
  •  Alamri, H., Cartillier, V., Das, A., Wang, J., Lee, S., Anderson, P., Essa, I., Parikh, D., Batra, D., Cherian, A., Marks, T.K., Hori, C., "Audio-Visual Scene-Aware Dialog", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR.2019.00774, June 2019, pp. 7550-7559.
    BibTeX TR2019-048 PDF
    • @inproceedings{Alamri2019jun,
    • author = {Alamri, Huda and Cartillier, Vincent and Das, Abhishek and Wang, Jue and Lee, Stefan and Anderson, Peter and Essa, Irfan and Parikh, Devi and Batra, Dhruv and Cherian, Anoop and Marks, Tim K. and Hori, Chiori},
    • title = {Audio-Visual Scene-Aware Dialog},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2019,
    • pages = {7550--7559},
    • month = jun,
    • doi = {10.1109/CVPR.2019.00774},
    • url = {https://www.merl.com/publications/TR2019-048}
    • }
  •  Lee, T.-Y., van Baar, J., Wittenburg, K.B., Sullivan, A., "Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop, June 2019, pp. 99-102.
    BibTeX TR2019-049 PDF
    • @inproceedings{Lee2019jun2,
    • author = {Lee, Teng-Yok and van Baar, Jeroen and Wittenburg, Kent B. and Sullivan, Alan},
    • title = {Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop},
    • year = 2019,
    • pages = {99--102},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2019-049}
    • }