Publications

Alamri, H., Cartillier, V., Lopes, R., Das, A., Wang, J., Essa, I., Batra, D., Parikh, D., Cherian, A., Marks, T.K., Hori, C., "Audio Visual Scene-Aware Dialog (AVSD) Challenge at DSTC7", arXiv, July 12, 2018.
BibTeX arXiv
- @article{Alamri2018jul,
- author = {Alamri, Huda and Cartillier, Vincent and Lopes, Raphael and Das, Abhishek and Wang, Jue and Essa, Irfan and Batra, Dhruv and Parikh, Devi and Cherian, Anoop and Marks, Tim K. and Hori, Chiori},
- title = {{Audio Visual Scene-Aware Dialog (AVSD) Challenge at DSTC7}},
- journal = {arXiv},
- year = 2018,
- month = jul,
- url = {https://arxiv.org/abs/1806.00525}
- }
Zhang, Z., "LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks", arXiv, July 12, 2018.
BibTeX arXiv
- @article{Zhang2018jul,
- author = {Zhang, Ziming},
- title = {{LMKL-Net: A Fast Localized Multiple Kernel Learning Solver via Deep Neural Networks}},
- journal = {arXiv},
- year = 2018,
- month = jul,
- url = {https://arxiv.org/abs/1805.08656}
- }
Zhang, Z., Lin, R., Sullivan, A., "Deformable Part Networks", arXiv, July 12, 2018.
BibTeX arXiv
- @article{Zhang2018jul2,
- author = {Zhang, Ziming and Lin, Rongmei and Sullivan, Alan},
- title = {{Deformable Part Networks}},
- journal = {arXiv},
- year = 2018,
- month = jul,
- url = {https://arxiv.org/abs/1805.08808}
- }
Sanz, I., Bernal, C., Bono, A., Pajovic, M., Martinez, G., "Gaussian Process Regression Applied to VRLA Battery Voltage Prediction in Photovoltaic Off-Grid Systems", Jornada de Jovenes Investigadores, July 11, 2018.
BibTeX TR2018-077 PDF
- @inproceedings{Sanz2018jul,
- author = {Sanz, Ivan and Bernal, Carlos and Bono, Antonio and Pajovic, Milutin and Martinez, Gabriel},
- title = {{Gaussian Process Regression Applied to VRLA Battery Voltage Prediction in Photovoltaic Off-Grid Systems}},
- booktitle = {Jornada de Jovenes Investigadores},
- year = 2018,
- number = 6,
- month = jul,
- url = {https://www.merl.com/publications/TR2018-077}
- }
Pan, Y., Farahmand, A.-M., White, M., Nabi, S., Grover, P., Nikovski, D.N., "Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control", International Conference on Machine Learning (ICML), July 2018.
BibTeX TR2018-101 PDF
- @inproceedings{Pan2018jul,
- author = {Pan, Yangchen and Farahmand, Amir-massoud and White, Martha and Nabi, Saleh and Grover, Piyush and Nikovski, Daniel N.},
- title = {{Reinforcement Learning with Function-Valued Action Spaces for Partial Differential Equation Control}},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2018,
- month = jul,
- url = {https://www.merl.com/publications/TR2018-101}
- }
Liu, J., Guo, J., Orlik, P.V., Shibata, M., Nakahara, D., Mii, S., Takac, M., "Anomaly Detection in Manufacturing Systems Using Structured Neural Networks", IEEE World Congress on Intelligent Control and Automation, DOI: 10.1109/WCICA.2018.8630692, July 2018, pp. 175-180.
BibTeX TR2018-097 PDF
- @inproceedings{Liu2018jul2,
- author = {Liu, Jie and Guo, Jianlin and Orlik, Philip V. and Shibata, Masahiko and Nakahara, Daiki and Mii, Satoshi and Takac, Martin},
- title = {{Anomaly Detection in Manufacturing Systems Using Structured Neural Networks}},
- booktitle = {IEEE World Congress on Intelligent Control and Automation},
- year = 2018,
- pages = {175--180},
- month = jul,
- doi = {10.1109/WCICA.2018.8630692},
- url = {https://www.merl.com/publications/TR2018-097}
- }
Shen, Y., Feng, C., Yang, Y., Tian, D., "Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018.
BibTeX TR2018-041 PDF Software
- @inproceedings{Shen2018jun,
- author = {Shen, Yiru and Feng, Chen and Yang, Yaoqing and Tian, Dong},
- title = {{Mining Point Cloud Local Structures by Kernel Correlation and Graph Pooling}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2018,
- month = jun,
- url = {https://www.merl.com/publications/TR2018-041}
- }
Yang, Y., Feng, C., Shen, Y., Tian, D., "FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2018.00029, June 2018.
BibTeX TR2018-042 PDF Video Software
- @inproceedings{Yang2018jun,
- author = {Yang, Yaoqing and Feng, Chen and Shen, Yiru and Tian, Dong},
- title = {{FoldingNet: Point Cloud Auto-encoder via Deep Grid Deformation}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2018,
- month = jun,
- doi = {10.1109/CVPR.2018.00029},
- url = {https://www.merl.com/publications/TR2018-042}
- }
Zhang, Z., Wu, Y., Wang, G., "BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018, pp. 3301-3309.
BibTeX TR2018-068 PDF
- @inproceedings{Zhang2018jun,
- author = {Zhang, Ziming and Wu, Yuanwei and Wang, Guanghui},
- title = {{BPGrad: Towards Global Optimality in Deep Learning via Branch and Pruning}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2018,
- pages = {3301--3309},
- month = jun,
- url = {https://www.merl.com/publications/TR2018-068}
- }
Nowara, E., Marks, T.K., Mansour, H., Nakamura, Y., Veeraraghavan, A., "SparsePPG: Towards Driver Monitoring Using Camera-Based Vital Signs Estimation in Near-Infrared", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop on Computer Vision for Physiological Measurement (CVPM), June 2018, pp. 1272-1281.
BibTeX TR2018-067 PDF
- @inproceedings{Nowara2018jun,
- author = {Nowara, Ewa and Marks, Tim K. and Mansour, Hassan and Nakamura, Yudai and Veeraraghavan, Ashok},
- title = {{SparsePPG: Towards Driver Monitoring Using Camera-Based Vital Signs Estimation in Near-Infrared}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop on Computer Vision for Physiological Measurement (CVPM)},
- year = 2018,
- pages = {1272--1281},
- month = jun,
- url = {https://www.merl.com/publications/TR2018-067}
- }
Deshmukh, A., Laftchiev, E., "Semi-Supervised Transfer Learning Using Marginal Predictors", IEEE Data Science Workshop, DOI: 10.1109/DSW.2018.8439908, June 6, 2018, pp. 160-164.
BibTeX TR2018-040 PDF Software
- @inproceedings{Deshmukh2018jun,
- author = {Deshmukh, Aniket and Laftchiev, Emil},
- title = {{Semi-Supervised Transfer Learning Using Marginal Predictors}},
- booktitle = {IEEE Data Science Workshop},
- year = 2018,
- pages = {160--164},
- month = jun,
- doi = {10.1109/DSW.2018.8439908},
- url = {https://www.merl.com/publications/TR2018-040}
- }
Ochiai, T., Watanabe, S., Katagiri, S., Hori, T., Hershey, J.R., "Speaker Adaptation for Multichannel End-to-End Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462161, April 2018, pp. 6707-6711.
BibTeX TR2018-006 PDF
- @inproceedings{Ochiai2018apr,
- author = {Ochiai, Tsubasa and Watanabe, Shinji and Katagiri, Shigeru and Hori, Takaaki and Hershey, John R.},
- title = {{Speaker Adaptation for Multichannel End-to-End Speech Recognition}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {6707--6711},
- month = apr,
- doi = {10.1109/ICASSP.2018.8462161},
- url = {https://www.merl.com/publications/TR2018-006}
- }
Seki, H., Watanabe, S., Hori, T., Le Roux, J., Hershey, J.R., "An End-to-End Language-Tracking Speech Recognizer for Mixed-Language Speech", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462180, April 2018, pp. 4919-4923.
BibTeX TR2018-002 PDF Video
- @inproceedings{Seki2018apr,
- author = {Seki, Hiroshi and Watanabe, Shinji and Hori, Takaaki and {Le Roux}, Jonathan and Hershey, John R.},
- title = {{An End-to-End Language-Tracking Speech Recognizer for Mixed-Language Speech}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {4919--4923},
- month = apr,
- doi = {10.1109/ICASSP.2018.8462180},
- url = {https://www.merl.com/publications/TR2018-002}
- }
Settle, S., Le Roux, J., Hori, T., Watanabe, S., Hershey, J.R., "End-to-End Multi-Speaker Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8461893, April 2018, pp. 4819-4823.
BibTeX TR2018-001 PDF Video
- @inproceedings{Settle2018apr,
- author = {Settle, Shane and {Le Roux}, Jonathan and Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
- title = {{End-to-End Multi-Speaker Speech Recognition}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {4819--4823},
- month = apr,
- doi = {10.1109/ICASSP.2018.8461893},
- url = {https://www.merl.com/publications/TR2018-001}
- }
Wang, Z.-Q., Le Roux, J., Hershey, J.R., "Alternative Objective Functions for Deep Clustering", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8462507, April 2018, pp. 686-690.
BibTeX TR2018-005 PDF
- @inproceedings{Wang2018apr,
- author = {Wang, Zhong-Qiu and {Le Roux}, Jonathan and Hershey, John R.},
- title = {{Alternative Objective Functions for Deep Clustering}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {686--690},
- month = apr,
- doi = {10.1109/ICASSP.2018.8462507},
- url = {https://www.merl.com/publications/TR2018-005}
- }
Wang, Z.-Q., Le Roux, J., Hershey, J.R., "Multi-Channel Deep Clustering: Discriminative Spectral and Spatial Embeddings for Speaker-Independent Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2018.8461639, April 2018, pp. 1-5.
BibTeX TR2018-007 PDF
- @inproceedings{Wang2018apr2,
- author = {Wang, Zhong-Qiu and {Le Roux}, Jonathan and Hershey, John R.},
- title = {{Multi-Channel Deep Clustering: Discriminative Spectral and Spatial Embeddings for Speaker-Independent Speech Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2018,
- pages = {1--5},
- month = apr,
- doi = {10.1109/ICASSP.2018.8461639},
- url = {https://www.merl.com/publications/TR2018-007}
- }
Zhang, Z., Kag, A., Sullivan, A., Saligrama, V., "Equilibrated Recurrent Neural Network: Neuronal Time-Delayed Self-Feedback Improves Accuracy and Stability", arXiv, March 2019.
BibTeX arXiv
- @article{Zhang2018mar2,
- author = {Zhang, Ziming and Kag, Anil and Sullivan, Alan and Saligrama, Venkatesh},
- title = {{Equilibrated Recurrent Neural Network: Neuronal Time-Delayed Self-Feedback Improves Accuracy and Stability}},
- journal = {arXiv},
- year = 2019,
- month = mar,
- url = {https://arxiv.org/abs/1903.00755}
- }
Zhang, Z., Xu, W., Sullivan, A., "Time-Delay Momentum: A Regularization Perspective on the Convergence and Generalization of Stochastic Momentum for Deep Learning", arXiv, March 2019.
BibTeX arXiv
- @article{Zhang2018mar,
- author = {Zhang, Ziming and Xu, Wenju and Sullivan, Alan},
- title = {{Time-Delay Momentum: A Regularization Perspective on the Convergence and Generalization of Stochastic Momentum for Deep Learning}},
- journal = {arXiv},
- year = 2019,
- month = mar,
- url = {https://arxiv.org/abs/1903.00760}
- }
Quivira, F., Koike-Akino, T., Wang, Y., Erdogmus, D., "Translating sEMG Signals to Continuous Hand Poses using Recurrent Neural Networks", IEEE Conference on Biomedical and Health Informatics (BHI), DOI: 10.1109/BHI.2018.8333395, January 2018.
BibTeX TR2018-014 PDF Presentation
- @inproceedings{Quivira2018jan,
- author = {Quivira, Fernando and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
- title = {{Translating sEMG Signals to Continuous Hand Poses using Recurrent Neural Networks}},
- booktitle = {IEEE Conference on Biomedical and Health Informatics (BHI)},
- year = 2018,
- month = jan,
- doi = {10.1109/BHI.2018.8333395},
- url = {https://www.merl.com/publications/TR2018-014}
- }
Hori, C., Hori, T., "End-to-end Conversation Modeling Track in DSTC6", Dialog System Technology Challenges, December 2017.
BibTeX TR2017-188 PDF
- @inproceedings{Hori2017dec3,
- author = {Hori, Chiori and Hori, Takaaki},
- title = {{End-to-end Conversation Modeling Track in DSTC6}},
- booktitle = {Dialog System Technology Challenges},
- year = 2017,
- month = dec,
- url = {https://www.merl.com/publications/TR2017-188}
- }
Hori, C., Hori, T., Marks, T.K., Hershey, J.R., "Early and Late Integration of Audio Features for Automatic Video Description", IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), DOI: 10.1109/ASRU.2017.8268968, December 2017.
BibTeX TR2017-183 PDF
- @inproceedings{Hori2017dec2,
- author = {Hori, Chiori and Hori, Takaaki and Marks, Tim K. and Hershey, John R.},
- title = {{Early and Late Integration of Audio Features for Automatic Video Description}},
- booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)},
- year = 2017,
- month = dec,
- doi = {10.1109/ASRU.2017.8268968},
- url = {https://www.merl.com/publications/TR2017-183}
- }
Hori, T., Watanabe, S., Hershey, J.R., "Multi-level Language Modeling and Decoding for Open Vocabulary End-to-End Speech Recognition", IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), DOI: 10.1109/ASRU.2017.8268948, December 2017.
BibTeX TR2017-181 PDF
- @inproceedings{Hori2017dec,
- author = {Hori, Takaaki and Watanabe, Shinji and Hershey, John R.},
- title = {{Multi-level Language Modeling and Decoding for Open Vocabulary End-to-End Speech Recognition}},
- booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)},
- year = 2017,
- month = dec,
- doi = {10.1109/ASRU.2017.8268948},
- url = {https://www.merl.com/publications/TR2017-181}
- }
Watanabe, S., Hori, T., Hershey, J.R., "Language Independent End-to-End Architecture For Joint Language and Speech Recognition", IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), DOI: 10.1109/ASRU.2017.8268945, December 2017.
BibTeX TR2017-182 PDF Video
- @inproceedings{Watanabe2017dec,
- author = {Watanabe, Shinji and Hori, Takaaki and Hershey, John R.},
- title = {{Language Independent End-to-End Architecture For Joint Language and Speech Recognition}},
- booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)},
- year = 2017,
- month = dec,
- doi = {10.1109/ASRU.2017.8268945},
- url = {https://www.merl.com/publications/TR2017-182}
- }
Wang, W., Koji, Y., Harsham, B.A., Hori, T., Hershey, J.R., "Sequence Adversarial Training and Minimum Bayes Risk Decoding for End-to-end Neural Conversation Models", Dialog System Technology Challenges, December 2017.
BibTeX TR2017-180 PDF
- @inproceedings{Wang2017dec,
- author = {Wang, Wen and Koji, Yusuke and Harsham, Bret A. and Hori, Takaaki and Hershey, John R.},
- title = {{Sequence Adversarial Training and Minimum Bayes Risk Decoding for End-to-end Neural Conversation Models}},
- booktitle = {Dialog System Technology Challenges},
- year = 2017,
- month = dec,
- url = {https://www.merl.com/publications/TR2017-180}
- }
Zhang, Z., Brand, M., "Convergent Block Coordinate Descent for Training Tikhonov Regularized Deep Neural Networks", Advances in Neural Information Processing Systems (NIPS), December 2017.
BibTeX TR2017-140 PDF
- @inproceedings{Ziming2017dec,
- author = {Zhang, Ziming and Brand, Matthew},
- title = {{Convergent Block Coordinate Descent for Training Tikhonov Regularized Deep Neural Networks}},
- booktitle = {Advances in Neural Information Processing Systems (NIPS)},
- year = 2017,
- month = dec,
- url = {https://www.merl.com/publications/TR2017-140}
- }