- Kumar, A., Marks, T.K., Mou, W., Wang, Y., Cherian, A., Jones, M.J., Liu, X., Koike-Akino, T., Feng, C., "LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00826, June 2020.
BibTeX TR2020-067 PDF Video Data Software- @inproceedings{Kumar2020jun,
- author = {Kumar, Abhinav and Marks, Tim K. and Mou, Wenxuan and Wang, Ye and Cherian, Anoop and Jones, Michael J. and Liu, Xiaoming and Koike-Akino, Toshiaki and Feng, Chen},
- title = {LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2020,
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/CVPR42600.2020.00826},
- issn = {2575-7075},
- isbn = {978-1-7281-7168-5},
- url = {https://www.merl.com/publications/TR2020-067}
- }
- Wu, P., Chen, S., "MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.01140, June 2020, pp. 11382-11392.
BibTeX TR2020-068 PDF Data Software- @inproceedings{Wu2020jun,
- author = {Wu, Pengxiang and Chen, Siheng},
- title = {MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2020,
- pages = {11382--11392},
- month = jun,
- doi = {10.1109/CVPR42600.2020.01140},
- url = {https://www.merl.com/publications/TR2020-068}
- }
- Chen, S., Liu, B., Feng, C., Vallespi-Gonzalez, C., Wellington, C., "3D Point Cloud Processing and Learning for Autonomous Driving", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2020.2984780, Vol. 38, No. 1, pp. 68-86, May 2020.
BibTeX TR2020-066 PDF- @article{Chen2020may2,
- author = {Chen, Siheng and Liu, Baoan and Feng, Chen and Vallespi-Gonzalez, Carlos and Wellington, Carl},
- title = {3D Point Cloud Processing and Learning for Autonomous Driving},
- journal = {IEEE Signal Processing Magazine},
- year = 2020,
- volume = 38,
- number = 1,
- pages = {68--86},
- month = may,
- doi = {10.1109/MSP.2020.2984780},
- url = {https://www.merl.com/publications/TR2020-066}
- }
- Fujihashi, T., Koike-Akino, T., Watanabe, T., Orlik, P.V., "High-Quality Soft Image Delivery with Deep Image Denoising", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC40277.2020.9148611, May 2020.
BibTeX TR2020-060 PDF Video- @inproceedings{Fujihashi2020may,
- author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi and Orlik, Philip V.},
- title = {High-Quality Soft Image Delivery with Deep Image Denoising},
- booktitle = {IEEE International Conference on Communications (ICC)},
- year = 2020,
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICC40277.2020.9148611},
- issn = {1938-1883},
- isbn = {978-1-7281-5089-5},
- url = {https://www.merl.com/publications/TR2020-060}
- }
- Bhamidipati, S., Kim, K.J., Sun, H., Orlik, P.V., "Artificial Intelligence-Based Distributed Belief Propagation and Recurrent Neural Network Algorithm for Wide-Area Monitoring Systems", IEEE Network, DOI: 10.1109/MNET.011.1900322, Vol. 34, No. 3, pp. 64-72, May 2020.
BibTeX TR2020-058 PDF- @article{Bhamidipati2020may,
- author = {Bhamidipati, Sriramya and Kim, Kyeong Jin and Sun, Hongbo and Orlik, Philip V.},
- title = {Artificial Intelligence-Based Distributed Belief Propagation and Recurrent Neural Network Algorithm for Wide-Area Monitoring Systems},
- journal = {IEEE Network},
- year = 2020,
- volume = 34,
- number = 3,
- pages = {64--72},
- month = may,
- doi = {10.1109/MNET.011.1900322},
- url = {https://www.merl.com/publications/TR2020-058}
- }
- Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Learning Invariant Representations from EEG via Adversarial Inference", IEEE Access, DOI: 10.1109/ACCESS.2020.2971600, Vol. 8, pp. 27074-27085, April 2020.
BibTeX TR2020-049 PDF- @article{Ozdenizci2020apr,
- author = {Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
- title = {Learning Invariant Representations from EEG via Adversarial Inference},
- journal = {IEEE Access},
- year = 2020,
- volume = 8,
- pages = {27074--27085},
- month = apr,
- doi = {10.1109/ACCESS.2020.2971600},
- issn = {2169-3536},
- url = {https://www.merl.com/publications/TR2020-049}
- }
- Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "End-To-End Multi-Speaker Speech Recognition with Transformer", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054029, April 2020, pp. 6134-6138.
BibTeX TR2020-043 PDF Video Presentation- @inproceedings{Chang2020apr,
- author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and Le Roux, Jonathan and Watanabe, Shinji},
- title = {End-To-End Multi-Speaker Speech Recognition with Transformer},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {6134--6138},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9054029},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-043}
- }
- Pishdadian, F., Wichern, G., Le Roux, J., "Learning to Separate Sounds From Weakly Labeled Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053055, April 2020, pp. 91-95.
BibTeX TR2020-038 PDF Video Presentation- @inproceedings{Pishdadian2020apr,
- author = {Pishdadian, Fatemeh and Wichern, Gordon and Le Roux, Jonathan},
- title = {Learning to Separate Sounds From Weakly Labeled Scenes},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {91--95},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053055},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-038}
- }
- Al-Shabili, A., Mansour, H., Boufounos, P.T., "Learning Plug-and-Play Proximal Quasi-Newton Denoisers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054537, April 2020, pp. 8896-8900.
BibTeX TR2020-045 PDF Video- @inproceedings{Al-Shabili2020apr,
- author = {Al-Shabili, Abdullah and Mansour, Hassan and Boufounos, Petros T.},
- title = {Learning Plug-and-Play Proximal Quasi-Newton Denoisers},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {8896--8900},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9054537},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-045}
- }
- Maciejewski, M., Wichern, G., McQuinn, E., Le Roux, J., "WHAMR!: Noisy and Reverberant Single-Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053327, April 2020, pp. 696-700.
BibTeX TR2020-042 PDF Video Presentation- @inproceedings{Maciejewski2020apr,
- author = {Maciejewski, Matthew and Wichern, Gordon and McQuinn, Emmett and Le Roux, Jonathan},
- title = {WHAMR!: Noisy and Reverberant Single-Channel Speech Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {696--700},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053327},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-042}
- }
- Moritz, N., Hori, T., Le Roux, J., "Streaming Automatic Speech Recognition With The Transformer Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054476, April 2020, pp. 6074-6078.
BibTeX TR2020-040 PDF Video Presentation- @inproceedings{Moritz2020apr,
- author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
- title = {Streaming Automatic Speech Recognition With The Transformer Model},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {6074--6078},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9054476},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-040}
- }
- Sari, L., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Speaker Adaptation Using Attention-Based Speaker Memory For End-To-End ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054249, April 2020, pp. 7384-7388.
BibTeX TR2020-037 PDF Video Presentation- @inproceedings{Sari2020apr,
- author = {Sari, Leda and Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
- title = {Unsupervised Speaker Adaptation Using Attention-Based Speaker Memory For End-To-End ASR},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {7384--7388},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9054249},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-037}
- }
- Shi, L., Geng, S., Shuang, K., Hori, C., Liu, S., Gao, P., Su, S., "Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053595, April 2020, pp. 4412-4416.
BibTeX TR2020-046 PDF- @inproceedings{Shi2020apr,
- author = {Shi, Lei and Geng, Shijie and Shuang, Kai and Hori, Chiori and Liu, Songxiang and Gao, Peng and Su, Sen},
- title = {Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2020,
- pages = {4412--4416},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP40776.2020.9053595},
- issn = {2379-190X},
- isbn = {978-1-5090-6631-5},
- url = {https://www.merl.com/publications/TR2020-046}
- }
- Li, R., Wang, X., Mallidi, H., Watanabe, S., Hori, T., Hermansky, H., "Multi-Stream End-to-End Speech Recognition", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2019.2959721, Vol. 28, pp. 646-655, March 2020.
BibTeX TR2020-030 PDF- @article{Li2020mar,
- author = {Li, Ruizhi and Wang, Xiaofei and Mallidi, Harish and Watanabe, Shinji and Hori, Takaaki and Hermansky, Hynek},
- title = {Multi-Stream End-to-End Speech Recognition},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2020,
- volume = 28,
- pages = {646--655},
- month = mar,
- doi = {10.1109/TASLP.2019.2959721},
- url = {https://www.merl.com/publications/TR2020-030}
- }
- D’Haro, L.F., Yoshino, K., Hori, C., Marks, T.K., Polymenakos, L., Kummerfeld, J.K., Galley, M., Gao, X., "Overview of the seventh Dialog System Technology Challenge: DSTC7", Computer Speech and Language, DOI: 10.1016/j.csl.2020.101068, Vol. 62, March 2020.
BibTeX TR2020-029 PDF- @article{D’Haro2020mar,
- author = {D’Haro, Luis Fernando and Yoshino, Koichiro and Hori, Chiori and Marks, Tim K. and Polymenakos, Lazaros and Kummerfeld, Jonathan K. and Galley, Michel and Gao, Xiang},
- title = {Overview of the seventh Dialog System Technology Challenge: DSTC7},
- journal = {Computer Speech and Language},
- year = 2020,
- volume = 62,
- month = mar,
- doi = {10.1016/j.csl.2020.101068},
- url = {https://www.merl.com/publications/TR2020-029}
- }
- Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Parsons, K., Sang, F., Klamkin, J., "Deep Neural Networks for Designing Integrated Photonics", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/OFC.2020.Th1A.6, March 2020.
BibTeX TR2020-057 PDF- @inproceedings{Kojima2020mar,
- author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Parsons, Kieran and Sang, Fengqiao and Klamkin, Jonathan},
- title = {Deep Neural Networks for Designing Integrated Photonics},
- booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
- year = 2020,
- month = mar,
- publisher = {OSA},
- doi = {10.1364/OFC.2020.Th1A.6},
- isbn = {978-1-943580-71-2},
- url = {https://www.merl.com/publications/TR2020-057}
- }
- Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D.K., Parsons, K., Qi, M., "Generative Deep Learning Model for a Multi-level NanoOptic Broadband Power Splitter", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/OFC.2020.Th1A.1, March 2020, pp. Th1A.1.
BibTeX TR2020-025 PDF- @inproceedings{Tang2020mar,
- author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh K. and Parsons, Kieran and Qi, Minghao},
- title = {Generative Deep Learning Model for a Multi-level NanoOptic Broadband Power Splitter},
- booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
- year = 2020,
- pages = {Th1A.1},
- month = mar,
- publisher = {OSA},
- doi = {10.1364/OFC.2020.Th1A.1},
- isbn = {978-1-943580-71-2},
- url = {https://www.merl.com/publications/TR2020-025}
- }
- Aihara, R., Wichern, G., Le Roux, J., "Deep Clustering-based Single Channel Speech Separation and Recent Advances", Acoustical Science and Technology, DOI: 10.1250/ast.41.465, Vol. 41, No. 2, pp. 465-471, March 2020.
BibTeX TR2021-020 PDF- @article{Aihara2020jun,
- author = {Aihara, Ryo and Wichern, Gordon and Le Roux, Jonathan},
- title = {Deep Clustering-based Single Channel Speech Separation and Recent Advances},
- journal = {Acoustical Science and Technology},
- year = 2020,
- volume = 41,
- number = 2,
- pages = {465--471},
- month = mar,
- doi = {10.1250/ast.41.465},
- url = {https://www.merl.com/publications/TR2021-020}
- }
- Ramachandra, B., Jones, M.J., Vatsavai, R., "Learning a distance function with a Siamese network to localize anomalies in videos", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093417, February 2020, pp. 2598-2607.
BibTeX TR2020-015 PDF- @inproceedings{Jones2020feb,
- author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
- title = {Learning a distance function with a Siamese network to localize anomalies in videos},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year = 2020,
- pages = {2598--2607},
- month = feb,
- doi = {10.1109/WACV45572.2020.9093417},
- url = {https://www.merl.com/publications/TR2020-015}
- }
- Cherian, A., Wang, J., Hori, C., Marks, T.K., "Spatio-Temporal Ranked-Attention Networks for Video Captioning", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093291, February 2020, pp. 1606-1615.
BibTeX TR2020-016 PDF- @inproceedings{Cherian2020feb,
- author = {Cherian, Anoop and Wang, Jue and Hori, Chiori and Marks, Tim K.},
- title = {Spatio-Temporal Ranked-Attention Networks for Video Captioning},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year = 2020,
- pages = {1606--1615},
- month = feb,
- publisher = {IEEE},
- doi = {10.1109/WACV45572.2020.9093291},
- url = {https://www.merl.com/publications/TR2020-016}
- }
- Huang, R., Xu, W., Lee, T.-Y., Cherian, A., Wang, Y., Marks, T.K., "FX-GAN: Self-Supervised GAN Learning via Feature Exchange", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093525, February 2020, pp. 3183-3191.
BibTeX TR2020-014 PDF- @inproceedings{Huang2020feb,
- author = {Huang, Rui and Xu, Wenju and Lee, Teng-Yok and Cherian, Anoop and Wang, Ye and Marks, Tim K.},
- title = {FX-GAN: Self-Supervised GAN Learning via Feature Exchange},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year = 2020,
- pages = {3183--3191},
- month = feb,
- publisher = {IEEE},
- doi = {10.1109/WACV45572.2020.9093525},
- url = {https://www.merl.com/publications/TR2020-014}
- }
- He, W., Lee, T.-Y., van Baar, J., Wittenburg, K.B., Shen, H.-W., "DynamicsExplorer: Visual Analytics for Robot Control Tasks involving Dynamics and LSTM-based Control Policies", IEEE Pacific Visualization Symposium (PacificVis), DOI: 10.1109/PacificVis48177.2020.7127, January 2020, pp. 36-45.
BibTeX TR2020-011 PDF- @inproceedings{He2020jan,
- author = {He, Wenbin and Lee, Teng-Yok and van Baar, Jeroen and Wittenburg, Kent B. and Shen, Han-Wei},
- title = {DynamicsExplorer: Visual Analytics for Robot Control Tasks involving Dynamics and LSTM-based Control Policies},
- booktitle = {IEEE Pacific Visualization Symposium (PacificVis)},
- year = 2020,
- pages = {36--45},
- month = jan,
- doi = {10.1109/PacificVis48177.2020.7127},
- url = {https://www.merl.com/publications/TR2020-011}
- }
- Chen, S., Duan, C., Yang, Y., Feng, C., Li, D., Tian, D., "Deep Unsupervised Learning of 3D Point Clouds via Graph Topology Inference and Filtering", IEEE Transactions on Image Processing, DOI: 10.1109/TIP.2019.2957935, pp. 3183-3198, January 2020.
BibTeX TR2020-004 PDF Data Software- @article{Chen2020jan,
- author = {Chen, Siheng and Duan, Chaojing and Yang, Yaoqing and Feng, Chen and Li, Duanshun and Tian, Dong},
- title = {Deep Unsupervised Learning of 3D Point Clouds via Graph Topology Inference and Filtering},
- journal = {IEEE Transactions on Image Processing},
- year = 2020,
- pages = {3183--3198},
- month = jan,
- doi = {10.1109/TIP.2019.2957935},
- url = {https://www.merl.com/publications/TR2020-004}
- }
- Xu, H., Sun, H., Nikovski, D.N., Kitamura, S., Mori, K., Hashimoto, H., "Deep Reinforcement Learning for Joint Bidding and Pricing of Load Serving Entity", IEEE Transactions on Smart Grid, DOI: 10.1109/TSG.2019.2903756, Vol. 10, No. 6, pp. 6366-6375, January 2020.
BibTeX TR2020-003 PDF- @article{Xu2020jan,
- author = {Xu, Hanchen and Sun, Hongbo and Nikovski, Daniel N. and Kitamura, Shoichi and Mori, Kazuyuki and Hashimoto, Hiroyuki},
- title = {Deep Reinforcement Learning for Joint Bidding and Pricing of Load Serving Entity},
- journal = {IEEE Transactions on Smart Grid},
- year = 2020,
- volume = 10,
- number = 6,
- pages = {6366--6375},
- month = jan,
- doi = {10.1109/TSG.2019.2903756},
- issn = {1949-3061},
- url = {https://www.merl.com/publications/TR2020-003}
- }
- Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2019, pp. 237-244.
BibTeX TR2019-157 PDF- @inproceedings{Chang2019dec,
- author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and Le Roux, Jonathan and Watanabe, Shinji},
- title = {MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition},
- booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
- year = 2019,
- pages = {237--244},
- month = dec,
- isbn = {978-1-7281-0305-1},
- url = {https://www.merl.com/publications/TR2019-157}
- }