Publications

606 / 3,737 publications found.


  •  Hori, C., Hori, T., Le Roux, J., "Optimizing Latency for Online Video Captioning Using Audio-Visual Transformers", Interspeech, DOI: 10.21437/​Interspeech.2021-1975, August 2021, pp. 586–590.
    BibTeX TR2021-093 PDF
    • @inproceedings{Hori2021aug2,
    • author = {Hori, Chiori and Hori, Takaaki and Le Roux, Jonathan},
    • title = {Optimizing Latency for Online Video Captioning Using Audio-Visual Transformers},
    • booktitle = {Interspeech},
    • year = 2021,
    • pages = {586--590},
    • month = aug,
    • publisher = {ISCA},
    • doi = {10.21437/Interspeech.2021-1975},
    • url = {https://www.merl.com/publications/TR2021-093}
    • }
  •  Cherian, A., Wang, J., "Generalized One-Class Learning Using Pairs of Complementary Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/​TPAMI.2021.3092999, June 2021.
    BibTeX TR2021-076 PDF Software
    • @article{Cherian2021jun,
    • author = {Cherian, Anoop and Wang, Jue},
    • title = {Generalized One-Class Learning Using Pairs of Complementary Classifiers},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2021,
    • month = jun,
    • doi = {10.1109/TPAMI.2021.3092999},
    • url = {https://www.merl.com/publications/TR2021-076}
    • }
  •  Hori, C., "Human Perspective Scene Understanding via Multimodal Sensing," Tech. Rep. TR2022-151, Audio-Visual Scene Understanding Tutorial at CVPR 2021, June 2021.
    BibTeX TR2022-151 PDF Video
    • @techreport{Hori2021jun,
    • author = {Hori, Chiori},
    • title = {Human Perspective Scene Understanding via Multimodal Sensing},
    • institution = {Mitsubishi Electric Research Laboratories},
    • year = 2021,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2022-151}
    • }
  •  Shi, L., Liu, D., Umeda, M., Hana, N., "Fusion-Based Image Correlations Framework For Strain Measurement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP39728.2021.9414987, June 2021.
    BibTeX TR2021-012 PDF Video
    • @inproceedings{Shi2021feb,
    • author = {Shi, Laixi and Liu, Dehong and Umeda, Masaki and Hana, Norihiko},
    • title = {Fusion-Based Image Correlations Framework For Strain Measurement},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2021,
    • month = jun,
    • doi = {10.1109/ICASSP39728.2021.9414987},
    • issn = {2379-190X},
    • isbn = {978-1-7281-7606-2},
    • url = {https://www.merl.com/publications/TR2021-012}
    • }
  •  Kim, S., Galley, M., Gunasekara, C., Lee, S., Atkinson, A., Peng, B., Schulz, H., Gao, J., Li, J., Adada, M., Huang, M., Lastras, L., Kummerfeld, J.K., Lasecki, W.S., Hori, C., Cherian, A., Marks, T.K., Rastogi, A., Zang, X., Sunkara, S., Gupta, R., "Overview of the Eighth Dialog System Technology Challenge: DSTC8", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2021.3078368, May 2021.
    BibTeX TR2021-064 PDF
    • @article{Kim2021may,
    • author = {Kim, Seokhwan and Galley, Michel and Gunasekara, Chulaka and Lee, Sungjin and Atkinson, Adam and Peng, Baolin and Schulz, Hannes and Gao, Jianfeng and Li, Jinchao and Adada, Mahmoud and Huang, Minlie and Lastras, Luis and Kummerfeld, Jonathan K. and Lasecki, Walter S. and Hori, Chiori and Cherian, Anoop and Marks, Tim K. and Rastogi, Abhinav and Zang, Xiaoxue and Sunkara, Srinivas and Gupta, Raghav},
    • title = {Overview of the Eighth Dialog System Technology Challenge: DSTC8},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • year = 2021,
    • month = may,
    • doi = {10.1109/TASLP.2021.3078368},
    • issn = {2329-9290},
    • url = {https://www.merl.com/publications/TR2021-064}
    • }
  •  Hori, C., Tsuchiya, M., Chen, S., Cherian, A., Hori, T., Harsham, B.A., Marks, T.K., Le Roux, J., Sullivan, A., Vetro, A., "マルチモーダルセンシング情報に基づくScene-aware Interaction 技術", Society of Automotive Engineers of Japan, Vol. 75, No. 5, pp. 66-71, May 2021.
    BibTeX TR2021-042 PDF Video
    • @article{Hori2021may,
    • author = {Hori, Chiori and Tsuchiya, Masato and Chen, Siheng and Cherian, Anoop and Hori, Takaaki and Harsham, Bret A. and Marks, Tim K. and Le Roux, Jonathan and Sullivan, Alan and Vetro, Anthony},
    • title = {マルチモーダルセンシング情報に基づくScene-aware Interaction 技術},
    • journal = {Society of Automotive Engineers of Japan},
    • year = 2021,
    • volume = 75,
    • number = 5,
    • pages = {66--71},
    • month = may,
    • url = {https://www.merl.com/publications/TR2021-042}
    • }
  •  Ota, K., Jha, D.K., Romeres, D., van Baar, J., Smith, K., Semistsu, T., Oiki, T., Sullivan, A., Nikovski, D.N., Tenenbaum, J.B., "Data-Efficient Learning for Complex and Real-Time Physical Problem Solving using Augmented Simulation", IEEE Robotics and Automation Letters, DOI: 10.1109/​LRA.2021.3068887, Vol. 6, No. 2, March 2021.
    BibTeX TR2021-032 PDF Video Software
    • @article{Ota2021mar,
    • author = {Ota, Kei and Jha, Devesh K. and Romeres, Diego and van Baar, Jeroen and Smith, Kevin and Semistsu, Takayuki and Oiki, Tomoaki and Sullivan, Alan and Nikovski, Daniel N. and Tenenbaum, Joshua B.},
    • title = {Data-Efficient Learning for Complex and Real-Time Physical Problem Solving using Augmented Simulation},
    • journal = {IEEE Robotics and Automation Letters},
    • year = 2021,
    • volume = 6,
    • number = 2,
    • month = mar,
    • doi = {10.1109/LRA.2021.3068887},
    • url = {https://www.merl.com/publications/TR2021-032}
    • }
  •  Ramachandra, B., Jones, M.J., Vatsavai, R., "Perceptual Metric Learning for Video Anomaly Detection", Machine Vision and Applications, DOI: 10.1007/​s00138-021-01187-5, Vol. 32, No. 63, pp. 1-18, March 2021.
    BibTeX TR2021-028 PDF
    • @article{Ramachandra2021mar,
    • author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
    • title = {Perceptual Metric Learning for Video Anomaly Detection},
    • journal = {Machine Vision and Applications},
    • year = 2021,
    • volume = 32,
    • number = 63,
    • pages = {1--18},
    • month = mar,
    • doi = {10.1007/s00138-021-01187-5},
    • url = {https://www.merl.com/publications/TR2021-028}
    • }
  •  Geng, S., Gao, P., Chatterjee, M., Hori, C., Le Roux, J., Zhang, Y., Li, H., Cherian, A., "Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers", AAAI Conference on Artificial Intelligence, February 2021, pp. 1415-1423.
    BibTeX TR2021-010 PDF
    • @inproceedings{Geng2021feb,
    • author = {Geng, Shijie and Gao, Peng and Chatterjee, Moitreya and Hori, Chiori and Le Roux, Jonathan and Zhang, Yongfeng and Li, Hongsheng and Cherian, Anoop},
    • title = {Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2021,
    • pages = {1415--1423},
    • month = feb,
    • publisher = {AAAI Press, Palo Alto, California USA},
    • isbn = {978-1-57735-866-4},
    • url = {https://www.merl.com/publications/TR2021-010}
    • }
  •  Lohit, S., Anirudh, R., Turaga, P., "Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
    BibTeX TR2021-004 PDF
    • @inproceedings{Lohit2021jan,
    • author = {Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
    • title = {Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2021,
    • month = jan,
    • publisher = {CVF OpenAccess},
    • url = {https://www.merl.com/publications/TR2021-004}
    • }
  •  Anirudh, R., Lohit, S., Turaga, P., "Generative Patch Priors for Practical Compressive Image Recovery", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
    BibTeX TR2021-003 PDF
    • @inproceedings{Anirudh2021jan,
    • author = {Anirudh, Rushil and Lohit, Suhas and Turaga, Pavan},
    • title = {Generative Patch Priors for Practical Compressive Image Recovery},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2021,
    • month = jan,
    • publisher = {CVF OpenAccess},
    • url = {https://www.merl.com/publications/TR2021-003}
    • }
  •  Nowara, E., Marks, T.K., Mansour, H., Veeraraghavan, A., "Near-Infrared Imaging Photoplethysmography During Driving", IEEE Transactions on Intelligent Transportation Systems, DOI: 10.1109/​TITS.2020.3038317, pp. 1-12, December 2020.
    BibTeX TR2020-161 PDF
    • @article{Nowara2020dec,
    • author = {Nowara, Ewa and Marks, Tim K. and Mansour, Hassan and Veeraraghavan, Ashok},
    • title = {Near-Infrared Imaging Photoplethysmography During Driving},
    • journal = {IEEE Transactions on Intelligent Transportation Systems},
    • year = 2020,
    • pages = {1--12},
    • month = dec,
    • doi = {10.1109/TITS.2020.3038317},
    • url = {https://www.merl.com/publications/TR2020-161}
    • }
  •  Li, M., Chen, S., Chen, X., Zhang, Y., Wang, Y., Tian, Q., "Symbiotic Graph Neural Networks for 3D Skeleton-based Human Action Recognition and Motion Prediction", IEEE Transactions on Pattern Analysis and Machine Intelligence, December 2020.
    BibTeX TR2020-166 PDF
    • @article{Chen2020dec,
    • author = {Li, Maosen and Chen, Siheng and Chen, Xu and Zhang, Ya and Wang, Yanfeng and Tian, Qi},
    • title = {Symbiotic Graph Neural Networks for 3D Skeleton-based Human Action Recognition and Motion Prediction},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2020,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2020-166}
    • }
  •  Corcodel, R., Jain, S., van Baar, J., "Interactive Tactile Perception for Classification of Novel Object Instances", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/​IROS45743.2020.9341795, November 2020, pp. 9861-9868.
    BibTeX TR2020-143 PDF Video
    • @inproceedings{Corcodel2020nov,
    • author = {Corcodel, Radu and Jain, Siddarth and van Baar, Jeroen},
    • title = {Interactive Tactile Perception for Classification of Novel Object Instances},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • year = 2020,
    • pages = {9861--9868},
    • month = nov,
    • publisher = {IEEE},
    • doi = {10.1109/IROS45743.2020.9341795},
    • url = {https://www.merl.com/publications/TR2020-143}
    • }
  •  Jones, M.J., Ramachandra, B., Vatsavai, R., "A Survey of Single-Scene Video Anomaly Detection", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/​TPAMI.2020.3040591, Vol. 44, No. 5, pp. 2293-2312, November 2020.
    BibTeX TR2021-029 PDF
    • @article{Jones2020nov,
    • author = {Jones, Michael J. and Ramachandra, Bharathkumar and Vatsavai, Ranga},
    • title = {A Survey of Single-Scene Video Anomaly Detection},
    • journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
    • year = 2020,
    • volume = 44,
    • number = 5,
    • pages = {2293--2312},
    • month = nov,
    • doi = {10.1109/TPAMI.2020.3040591},
    • url = {https://www.merl.com/publications/TR2021-029}
    • }
  •  Cherian, A., Chatterjee, M., Ahuja, N., "Sound2Sight: Generating Visual Dynamics from Sound and Context", European Conference on Computer Vision (ECCV), Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M., Eds., August 2020.
    BibTeX TR2020-121 PDF Software
    • @inproceedings{Cherian2020aug,
    • author = {Cherian, Anoop and Chatterjee, Moitreya and Ahuja, Narendra},
    • title = {Sound2Sight: Generating Visual Dynamics from Sound and Context},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2020,
    • editor = {Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M.},
    • month = aug,
    • publisher = {Springer},
    • url = {https://www.merl.com/publications/TR2020-121}
    • }
  •  Cherian, A., Aeron, S., "Representation Learning via Adversarially-Contrastive Optimal Transport", International Conference on Machine Learning (ICML), Daumé, H. and Singh, A., Eds., July 2020, pp. 10675-10685.
    BibTeX TR2020-093 PDF Software
    • @inproceedings{Cherian2020jul,
    • author = {Cherian, Anoop and Aeron, Shuchin},
    • title = {Representation Learning via Adversarially-Contrastive Optimal Transport},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2020,
    • editor = {Daumé, H. and Singh, A.},
    • pages = {10675--10685},
    • month = jul,
    • url = {https://www.merl.com/publications/TR2020-093}
    • }
  •  Hu, Y., Chen, S., Zhang, Y., Gu, X., "Collaborative Motion Prediction via Neural Motion Message Passing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR42600.2020.00635, June 2020, pp. 6318-6327.
    BibTeX TR2020-072 PDF
    • @inproceedings{Hu2020jun,
    • author = {Hu, Yue and Chen, Siheng and Zhang, Ya and Gu, Xiao},
    • title = {Collaborative Motion Prediction via Neural Motion Message Passing},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {6318--6327},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.00635},
    • url = {https://www.merl.com/publications/TR2020-072}
    • }
  •  Li, M., Chen, S., Zhao, Y., Zhang, Y., Wang, Y., Tian, Q., "Dynamic Multiscale Graph Neural Networks for 3D Skeleton-Based Human Motion Prediction", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR42600.2020.00029, June 2020, pp. 211-220.
    BibTeX TR2020-073 PDF
    • @inproceedings{Li2020jun,
    • author = {Li, Maosen and Chen, Siheng and Zhao, Yangheng and Zhang, Ya and Wang, Yanfeng and Tian, Qi},
    • title = {Dynamic Multiscale Graph Neural Networks for 3D Skeleton-Based Human Motion Prediction},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {211--220},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.00029},
    • url = {https://www.merl.com/publications/TR2020-073}
    • }
  •  Kumar, A., Marks, T.K., Mou, W., Wang, Y., Cherian, A., Jones, M.J., Liu, X., Koike-Akino, T., Feng, C., "LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR42600.2020.00826, June 2020.
    BibTeX TR2020-067 PDF Video Data Software
    • @inproceedings{Kumar2020jun,
    • author = {Kumar, Abhinav and Marks, Tim K. and Mou, Wenxuan and Wang, Ye and Cherian, Anoop and Jones, Michael J. and Liu, Xiaoming and Koike-Akino, Toshiaki and Feng, Chen},
    • title = {LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/CVPR42600.2020.00826},
    • issn = {2575-7075},
    • isbn = {978-1-7281-7168-5},
    • url = {https://www.merl.com/publications/TR2020-067}
    • }
  •  Wu, P., Chen, S., "MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/​CVPR42600.2020.01140, June 2020, pp. 11382-11392.
    BibTeX TR2020-068 PDF Data Software
    • @inproceedings{Wu2020jun,
    • author = {Wu, Pengxiang and Chen, Siheng},
    • title = {MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {11382--11392},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.01140},
    • url = {https://www.merl.com/publications/TR2020-068}
    • }
  •  Onol, A.O., Corcodel, R., Long, P., Padir, T., "Tuning-Free Contact-Implicit Trajectory Optimization", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/​ICRA40945.2020.9196805, May 2020, pp. 1183-1189.
    BibTeX TR2020-065 PDF Video
    • @inproceedings{Onol2020may,
    • author = {Onol, Aykut O. and Corcodel, Radu and Long, Philip and Padir, Taskin},
    • title = {Tuning-Free Contact-Implicit Trajectory Optimization},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2020,
    • pages = {1183--1189},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA40945.2020.9196805},
    • issn = {2577-087X},
    • isbn = {978-1-7281-7395-5},
    • url = {https://www.merl.com/publications/TR2020-065}
    • }
  •  Chen, S., Liu, B., Feng, C., Vallespi-Gonzalez, C., Wellington, C., "3D Point Cloud Processing and Learning for Autonomous Driving", IEEE Signal Processing Magazine, DOI: 10.1109/​MSP.2020.2984780, Vol. 38, No. 1, pp. 68-86, May 2020.
    BibTeX TR2020-066 PDF
    • @article{Chen2020may2,
    • author = {Chen, Siheng and Liu, Baoan and Feng, Chen and Vallespi-Gonzalez, Carlos and Wellington, Carl},
    • title = {3D Point Cloud Processing and Learning for Autonomous Driving},
    • journal = {IEEE Signal Processing Magazine},
    • year = 2020,
    • volume = 38,
    • number = 1,
    • pages = {68--86},
    • month = may,
    • doi = {10.1109/MSP.2020.2984780},
    • url = {https://www.merl.com/publications/TR2020-066}
    • }
  •  Chen, S., Zhang, N., Sun, H., "Collaborative Localization Based on Traffic Landmarks for Autonomous Driving", IEEE International Symposium on Circuits and Systems (ISCAS), DOI: 10.1109/​ISCAS45731.2020.9180894, May 2020.
    BibTeX TR2020-064 PDF
    • @inproceedings{Chen2020may,
    • author = {Chen, Siheng and Zhang, Ningxiao and Sun, Huifang},
    • title = {Collaborative Localization Based on Traffic Landmarks for Autonomous Driving},
    • booktitle = {IEEE International Symposium on Circuits and Systems (ISCAS)},
    • year = 2020,
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ISCAS45731.2020.9180894},
    • url = {https://www.merl.com/publications/TR2020-064}
    • }
  •  Al-Shabili, A., Mansour, H., Boufounos, P.T., "Learning Plug-and-Play Proximal Quasi-Newton Denoisers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP40776.2020.9054537, April 2020, pp. 8896-8900.
    BibTeX TR2020-045 PDF Video
    • @inproceedings{Al-Shabili2020apr,
    • author = {Al-Shabili, Abdullah and Mansour, Hassan and Boufounos, Petros T.},
    • title = {Learning Plug-and-Play Proximal Quasi-Newton Denoisers},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {8896--8900},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054537},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-045}
    • }