Publications

Shi, L., Geng, S., Shuang, K., Hori, C., Liu, S., Gao, P., Su, S., "Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053595, April 2020, pp. 4412-4416.
BibTeX TR2020-046 PDF
- @inproceedings{Shi2020apr,
- author    = {Shi, Lei and Geng, Shijie and Shuang, Kai and Hori, Chiori and Liu, Songxiang and Gao, Peng and Su, Sen},
- title     = {Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2020},
- month     = apr,
- pages     = {4412--4416},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP40776.2020.9053595},
- issn      = {2379-190X},
- isbn      = {978-1-5090-6631-5},
- url       = {https://www.merl.com/publications/TR2020-046},
- }
D’Haro, L.F., Yoshino, K., Hori, C., Marks, T.K., Polymenakos, L., Kummerfeld, J.K., Galley, M., Gao, X., "Overview of the seventh Dialog System Technology Challenge: DSTC7", Computer Speech and Language, DOI: 10.1016/j.csl.2020.101068, Vol. 62, March 2020.
BibTeX TR2020-029 PDF
- @article{D’Haro2020mar,
- author  = {D'Haro, Luis Fernando and Yoshino, Koichiro and Hori, Chiori and Marks, Tim K. and Polymenakos, Lazaros and Kummerfeld, Jonathan K. and Galley, Michel and Gao, Xiang},
- title   = {Overview of the seventh {Dialog System Technology Challenge}: {DSTC7}},
- journal = {Computer Speech and Language},
- year    = {2020},
- month   = mar,
- volume  = {62},
- doi     = {10.1016/j.csl.2020.101068},
- url     = {https://www.merl.com/publications/TR2020-029},
- ids     = {DHaro2020mar},
- }
Ramachandra, B., Jones, M.J., Vatsavai, R., "Learning a distance function with a Siamese network to localize anomalies in videos", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093417, February 2020, pp. 2598-2607.
BibTeX TR2020-015 PDF
- @inproceedings{Jones2020feb,
- author    = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
- title     = {Learning a distance function with a {Siamese} network to localize anomalies in videos},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year      = {2020},
- month     = feb,
- pages     = {2598--2607},
- doi       = {10.1109/WACV45572.2020.9093417},
- url       = {https://www.merl.com/publications/TR2020-015},
- }
Cherian, A., Wang, J., Hori, C., Marks, T.K., "Spatio-Temporal Ranked-Attention Networks for Video Captioning", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093291, February 2020, pp. 1606-1615.
BibTeX TR2020-016 PDF
- @inproceedings{Cherian2020feb,
- author    = {Cherian, Anoop and Wang, Jue and Hori, Chiori and Marks, Tim K.},
- title     = {Spatio-Temporal Ranked-Attention Networks for Video Captioning},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year      = {2020},
- month     = feb,
- pages     = {1606--1615},
- publisher = {IEEE},
- doi       = {10.1109/WACV45572.2020.9093291},
- url       = {https://www.merl.com/publications/TR2020-016},
- }
Huang, R., Xu, W., Lee, T.-Y., Cherian, A., Wang, Y., Marks, T.K., "FX-GAN: Self-Supervised GAN Learning via Feature Exchange", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093525, February 2020, pp. 3183-3191.
BibTeX TR2020-014 PDF
- @inproceedings{Huang2020feb,
- author    = {Huang, Rui and Xu, Wenju and Lee, Teng-Yok and Cherian, Anoop and Wang, Ye and Marks, Tim K.},
- title     = {{FX-GAN}: Self-Supervised {GAN} Learning via Feature Exchange},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year      = {2020},
- month     = feb,
- pages     = {3183--3191},
- publisher = {IEEE},
- doi       = {10.1109/WACV45572.2020.9093525},
- url       = {https://www.merl.com/publications/TR2020-014},
- }
Ramachandra, B., Jones, M.J., "Street Scene: A new dataset and evaluation protocol for video anomaly detection", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/WACV45572.2020.9093457, February 2020, pp. 2569-2578.
BibTeX TR2020-017 PDF Data
- @inproceedings{Jones2020feb2,
- author    = {Ramachandra, Bharathkumar and Jones, Michael J.},
- title     = {{Street Scene}: A new dataset and evaluation protocol for video anomaly detection},
- booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
- year      = {2020},
- month     = feb,
- pages     = {2569--2578},
- doi       = {10.1109/WACV45572.2020.9093457},
- url       = {https://www.merl.com/publications/TR2020-017},
- }
He, W., Lee, T.-Y., van Baar, J., Wittenburg, K.B., Shen, H.-W., "DynamicsExplorer: Visual Analytics for Robot Control Tasks involving Dynamics and LSTM-based Control Policies", IEEE Pacific Visualization Symposium (PacificVis), DOI: 10.1109/PacificVis48177.2020.7127, January 2020, pp. 36-45.
BibTeX TR2020-011 PDF
- @inproceedings{He2020jan,
- author    = {He, Wenbin and Lee, Teng-Yok and van Baar, Jeroen and Wittenburg, Kent B. and Shen, Han-Wei},
- title     = {{DynamicsExplorer}: Visual Analytics for Robot Control Tasks involving Dynamics and {LSTM}-based Control Policies},
- booktitle = {IEEE Pacific Visualization Symposium (PacificVis)},
- year      = {2020},
- month     = jan,
- pages     = {36--45},
- doi       = {10.1109/PacificVis48177.2020.7127},
- url       = {https://www.merl.com/publications/TR2020-011},
- }
Chen, S., Duan, C., Yang, Y., Feng, C., Li, D., Tian, D., "Deep Unsupervised Learning of 3D Point Clouds via Graph Topology Inference and Filtering", IEEE Transactions on Image Processing, DOI: 10.1109/TIP.2019.2957935, pp. 3183-3198, January 2020.
BibTeX TR2020-004 PDF Data Software
- @article{Chen2020jan,
- author  = {Chen, Siheng and Duan, Chaojing and Yang, Yaoqing and Feng, Chen and Li, Duanshun and Tian, Dong},
- title   = {Deep Unsupervised Learning of {3D} Point Clouds via Graph Topology Inference and Filtering},
- journal = {IEEE Transactions on Image Processing},
- year    = {2020},
- month   = jan,
- pages   = {3183--3198},
- doi     = {10.1109/TIP.2019.2957935},
- url     = {https://www.merl.com/publications/TR2020-004},
- }
Zhang, Z., Wu, Y., Wang, G., "Unsupervised Deep Feature Transfer for Low Resolution Image Classification", IEEE International Conference on Computer Vision Workshops (ICCVW), DOI: 10.1109/ICCVW.2019.00136, October 2019, pp. 1065-1069.
BibTeX TR2019-127 PDF
- @inproceedings{Zhang2019oct,
- author    = {Zhang, Ziming and Wu, Yuanwei and Wang, Guanghui},
- title     = {Unsupervised Deep Feature Transfer for Low Resolution Image Classification},
- booktitle = {IEEE International Conference on Computer Vision Workshops (ICCVW)},
- year      = {2019},
- month     = oct,
- pages     = {1065--1069},
- doi       = {10.1109/ICCVW.2019.00136},
- url       = {https://www.merl.com/publications/TR2019-127},
- }
Wu, Y., Marks, T.K., Cherian, A., Chen, S., Feng, C., Wang, G., Sullivan, A., "Unsupervised Joint 3D Object Model Learning and 6D Pose Estimation for Depth-Based Instance Segmentation", IEEE ICCV Workshop on Recovering 6D Object Pose, DOI: 10.1109/ICCVW.2019.00339, October 2019, pp. 2777-2786.
BibTeX TR2019-118 PDF
- @inproceedings{Wu2019oct,
- author    = {Wu, Yuanwei and Marks, Tim K. and Cherian, Anoop and Chen, Siheng and Feng, Chen and Wang, Guanghui and Sullivan, Alan},
- title     = {Unsupervised Joint {3D} Object Model Learning and {6D} Pose Estimation for Depth-Based Instance Segmentation},
- booktitle = {IEEE ICCV Workshop on Recovering 6D Object Pose},
- year      = {2019},
- month     = oct,
- pages     = {2777--2786},
- doi       = {10.1109/ICCVW.2019.00339},
- url       = {https://www.merl.com/publications/TR2019-118},
- }
Paul, S., van Baar, J., Roy-Chowdhury, A.K., "Learning from Trajectories via Subgoal Discovery", Advances in Neural Information Processing Systems (NeurIPS), pp. 8409-8419, October 2019.
BibTeX TR2019-128 PDF
- @inproceedings{Paul2019oct,
- author    = {Paul, Sujoy and van Baar, Jeroen and Roy-Chowdhury, Amit K.},
- title     = {Learning from Trajectories via Subgoal Discovery},
- booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
- year      = {2019},
- month     = oct,
- pages     = {8409--8419},
- url       = {https://www.merl.com/publications/TR2019-128},
- }
Wang, J., Cherian, A., "GODS: Generalized One-class Discriminative Subspaces for Anomaly Detection", IEEE International Conference on Computer Vision (ICCV), DOI: 10.1109/ICCV.2019.00829, October 2019, pp. 8200-8210.
BibTeX TR2019-121 PDF
- @inproceedings{Wang2019oct2,
- author    = {Wang, Jue and Cherian, Anoop},
- title     = {{GODS}: Generalized One-class Discriminative Subspaces for Anomaly Detection},
- booktitle = {IEEE International Conference on Computer Vision (ICCV)},
- year      = {2019},
- month     = oct,
- pages     = {8200--8210},
- publisher = {IEEE},
- doi       = {10.1109/ICCV.2019.00829},
- url       = {https://www.merl.com/publications/TR2019-121},
- }
Marks, T.K., Kumar, A., Mou, W., Feng, C., Liu, X., "UGLLI Face Alignment: Estimating Uncertainty with Gaussian Log-Likelihood Loss", IEEE International Conference on Computer Vision (ICCV) Workshop on Statistical Deep Learning for Computer Vision (SDL-CV), DOI: 10.1109/ICCVW.2019.00103, October 2019, pp. 778-782.
BibTeX TR2019-117 PDF Data Software
- @inproceedings{Marks2019oct,
- author    = {Marks, Tim K. and Kumar, Abhinav and Mou, Wenxuan and Feng, Chen and Liu, Xiaoming},
- title     = {{UGLLI} Face Alignment: Estimating Uncertainty with {Gaussian} Log-Likelihood Loss},
- booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop on Statistical Deep Learning for Computer Vision (SDL-CV)},
- year      = {2019},
- month     = oct,
- pages     = {778--782},
- publisher = {IEEE},
- doi       = {10.1109/ICCVW.2019.00103},
- url       = {https://www.merl.com/publications/TR2019-117},
- }
Almeida, D., Ataer-Cansizoglu, E., Corcodel, R., "Detection, Tracking and 3D Modeling of Objects with Sparse RGB-D SLAM and Interactive Perception", IEEE-RAS International Conference on Humanoid Robots, DOI: 10.1109/Humanoids43949.2019.9035001, October 2019, pp. 1-8.
BibTeX TR2019-119 PDF
- @inproceedings{Almeida2019oct,
- author    = {Almeida, Diogo and Ataer-Cansizoglu, Esra and Corcodel, Radu},
- title     = {Detection, Tracking and {3D} Modeling of Objects with Sparse {RGB-D} {SLAM} and Interactive Perception},
- booktitle = {IEEE-RAS International Conference on Humanoid Robots},
- year      = {2019},
- month     = oct,
- pages     = {1--8},
- doi       = {10.1109/Humanoids43949.2019.9035001},
- url       = {https://www.merl.com/publications/TR2019-119},
- }
Kao, J.-Y., Ortega, A., Tian, D., Mansour, H., Vetro, A., "Graph Based Skeleton Modeling for Human Activity Analysis", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/ICIP.2019.8803186, September 2019.
BibTeX TR2019-037 PDF
- @inproceedings{Kao2019sep,
- author    = {Kao, Jiun-Yu and Ortega, Antonio and Tian, Dong and Mansour, Hassan and Vetro, Anthony},
- title     = {Graph Based Skeleton Modeling for Human Activity Analysis},
- booktitle = {IEEE International Conference on Image Processing (ICIP)},
- year      = {2019},
- month     = sep,
- publisher = {IEEE},
- doi       = {10.1109/ICIP.2019.8803186},
- issn      = {2381-8549},
- isbn      = {978-1-5386-6249-6},
- url       = {https://www.merl.com/publications/TR2019-037},
- }
Hori, C., Cherian, A., Marks, T.K., Hori, T., "Joint Student-Teacher Learning for Audio-Visual Scene-Aware Dialog", Interspeech, September 2019, pp. 1886-1890.
BibTeX TR2019-097 PDF
- @inproceedings{Hori2019sep,
- author    = {Hori, Chiori and Cherian, Anoop and Marks, Tim K. and Hori, Takaaki},
- title     = {Joint Student-Teacher Learning for Audio-Visual Scene-Aware Dialog},
- booktitle = {Interspeech},
- year      = {2019},
- month     = sep,
- pages     = {1886--1890},
- publisher = {ISCA},
- url       = {https://www.merl.com/publications/TR2019-097},
- }
Zhang, Z., Lin, Z., Pfister, H., "White-Box Adversarial Defense via Self-Supervised Data Estimation", arXiv, September 2019.
BibTeX arXiv Software
- @misc{Zhang2019sep,
- author        = {Zhang, Ziming and Lin, Zudi and Pfister, Hanspeter},
- title         = {White-Box Adversarial Defense via Self-Supervised Data Estimation},
- howpublished  = {arXiv preprint},
- year          = {2019},
- month         = sep,
- eprint        = {1909.06271},
- archiveprefix = {arXiv},
- url           = {https://arxiv.org/abs/1909.06271},
- }
Jones, M.J., Rambhatla, S., "Body Part Alignment and Temporal Attention for Video-Based Person Re-Identification", British Machine Vision Conference (BMVC), September 2019.
BibTeX TR2019-108 PDF
- @inproceedings{Jones2019sep,
- author    = {Jones, Michael J. and Rambhatla, Sai},
- title     = {Body Part Alignment and Temporal Attention for Video-Based Person Re-Identification},
- booktitle = {British Machine Vision Conference (BMVC)},
- year      = {2019},
- month     = sep,
- url       = {https://www.merl.com/publications/TR2019-108},
- }
Wang, J., Cherian, A., "Discriminative Video Representation Learning Using Support Vector Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2019.2937292, August 2019.
BibTeX TR2019-107 PDF
- @article{Wang2019aug,
- author  = {Wang, Jue and Cherian, Anoop},
- title   = {Discriminative Video Representation Learning Using Support Vector Classifiers},
- journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
- year    = {2019},
- month   = aug,
- doi     = {10.1109/TPAMI.2019.2937292},
- url     = {https://www.merl.com/publications/TR2019-107},
- }
Liu, D., Mansour, H., Boufounos, P.T., "Robust Mutual Information-Based Multi-Image Registration", IEEE International Geoscience and Remote Sensing Symposium (IGARSS), July 2019, pp. 915-918.
BibTeX TR2019-079 PDF
- @inproceedings{Liu2019jul,
- author    = {Liu, Dehong and Mansour, Hassan and Boufounos, Petros T.},
- title     = {Robust Mutual Information-Based Multi-Image Registration},
- booktitle = {IEEE International Geoscience and Remote Sensing Symposium (IGARSS)},
- year      = {2019},
- month     = jul,
- pages     = {915--918},
- url       = {https://www.merl.com/publications/TR2019-079},
- }
Huang, M., Zhao, M., Parikh, P., Wang, Y., Ozbay, K., Jiang, Z.-P., "Reinforcement Learning for Vision-Based Lateral Control of a Self-Driving Car", IEEE International Conference on Control and Automation (ICCA), DOI: 10.1109/JAS.2019.19117678, July 2019, pp. 1126-1131.
BibTeX TR2019-074 PDF
- @inproceedings{Huang2019jul,
- author    = {Huang, Mengzhe and Zhao, Mingyu and Parikh, Parthiv and Wang, Yebin and Ozbay, Kaan and Jiang, Zhong-Ping},
- title     = {Reinforcement Learning for Vision-Based Lateral Control of a Self-Driving Car},
- booktitle = {IEEE International Conference on Control and Automation (ICCA)},
- year      = {2019},
- month     = jul,
- pages     = {1126--1131},
- doi       = {10.1109/JAS.2019.19117678},
- url       = {https://www.merl.com/publications/TR2019-074},
- }
Alamri, H., Cartillier, V., Das, A., Wang, J., Lee, S., Anderson, P., Essa, I., Parikh, D., Batra, D., Cherian, A., Marks, T.K., Hori, C., "Audio-Visual Scene-Aware Dialog", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR.2019.00774, June 2019, pp. 7550-7559.
BibTeX TR2019-048 PDF
- @inproceedings{Alamri2019jun,
- author    = {Alamri, Huda and Cartillier, Vincent and Das, Abhishek and Wang, Jue and Lee, Stefan and Anderson, Peter and Essa, Irfan and Parikh, Devi and Batra, Dhruv and Cherian, Anoop and Marks, Tim K. and Hori, Chiori},
- title     = {Audio-Visual Scene-Aware Dialog},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year      = {2019},
- month     = jun,
- pages     = {7550--7559},
- doi       = {10.1109/CVPR.2019.00774},
- url       = {https://www.merl.com/publications/TR2019-048},
- }
Lee, T.-Y., van Baar, J., Wittenburg, K.B., Sullivan, A., "Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop, June 2019, pp. 99-102.
BibTeX TR2019-049 PDF
- @inproceedings{Lee2019jun2,
- author    = {Lee, Teng-Yok and van Baar, Jeroen and Wittenburg, Kent B. and Sullivan, Alan},
- title     = {Analysis of the contribution and temporal dependency of {LSTM} layers for reinforcement learning tasks},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop},
- year      = {2019},
- month     = jun,
- pages     = {99--102},
- url       = {https://www.merl.com/publications/TR2019-049},
- }
Raghunathan, A., Cherian, A., Jha, D.K., "Game Theoretic Optimization via Gradient-based Nikaido-Isoda Function", International Conference on Machine Learning (ICML), Lawrence, N. and Reid, M., Eds., June 2019, pp. 5291-5300.
BibTeX TR2019-045 PDF Software
- @inproceedings{Raghunathan2019jun,
- author    = {Raghunathan, Arvind and Cherian, Anoop and Jha, Devesh K.},
- title     = {Game Theoretic Optimization via Gradient-based {Nikaido-Isoda} Function},
- booktitle = {International Conference on Machine Learning (ICML)},
- editor    = {Lawrence, N. and Reid, M.},
- year      = {2019},
- month     = jun,
- pages     = {5291--5300},
- publisher = {PMLR},
- issn      = {2640-3498},
- url       = {https://www.merl.com/publications/TR2019-045},
- }
Chen, S., "Large-Scale 3D Point Cloud Representations via Graph Inception Networks with Applications to Autonomous Driving", Graph Signal Processing Workshop (GSP), DOI: 10.1109/ICIP.2019.8803525, June 2019, pp. 4395-4399.
BibTeX TR2019-039 PDF
- @inproceedings{Chen2019jun,
- author    = {Chen, Siheng},
- title     = {Large-Scale {3D} Point Cloud Representations via Graph Inception Networks with Applications to Autonomous Driving},
- booktitle = {Graph Signal Processing Workshop (GSP)},
- year      = {2019},
- month     = jun,
- pages     = {4395--4399},
- doi       = {10.1109/ICIP.2019.8803525},
- url       = {https://www.merl.com/publications/TR2019-039},
- }