Publications

Han, M., Ozdenizci, O., Koike-Akino, T., Wang, Y., Erdogmus, D., "Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders", IEEE Journal of Biomedical and Health Informatics, DOI: 10.1109/JBHI.2021.3062335, Vol. 25, No. 8, pp. 2928-2937, April 2021.
BibTeX TR2021-027 PDF
- @article{Han2021apr,
-   title   = {{Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders}},
-   author  = {Han, Mo and Ozdenizci, Ozan and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
-   journal = {IEEE Journal of Biomedical and Health Informatics},
-   volume  = {25},
-   number  = {8},
-   pages   = {2928--2937},
-   month   = apr,
-   year    = {2021},
-   issn    = {2168-2208},
-   doi     = {10.1109/JBHI.2021.3062335},
-   url     = {https://www.merl.com/publications/TR2021-027},
- }
Ramachandra, B., Jones, M.J., Vatsavai, R., "Perceptual Metric Learning for Video Anomaly Detection", Machine Vision and Applications, DOI: 10.1007/s00138-021-01187-5, Vol. 32, No. 63, pp. 1-18, March 2021.
BibTeX TR2021-028 PDF
- @article{Ramachandra2021mar,
- author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
- title = {{Perceptual Metric Learning for Video Anomaly Detection}},
- journal = {Machine Vision and Applications},
- year = 2021,
- volume = 32,
- number = 63,
- pages = {1--18},
- month = mar,
- doi = {10.1007/s00138-021-01187-5},
- url = {https://www.merl.com/publications/TR2021-028}
- }
Demir, A., Koike-Akino, T., Wang, Y., Erdogmus, D., "AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference", IEEE Access, DOI: 10.1109/ACCESS.2021.3064530, Vol. 9, pp. 39955-39972, March 2021.
BibTeX TR2021-016 PDF Presentation
- @article{Demir2021mar,
-   title   = {{AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference}},
-   author  = {Demir, Andac and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
-   journal = {IEEE Access},
-   volume  = {9},
-   pages   = {39955--39972},
-   month   = mar,
-   year    = {2021},
-   issn    = {2169-3536},
-   doi     = {10.1109/ACCESS.2021.3064530},
-   url     = {https://www.merl.com/publications/TR2021-016},
- }
Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D.K., TaherSima, M., Parsons, K., "Application of Deep Learning for Nanophotonic Device Design", SPIE Photonics West, Bahram Jalali and Ken-ichi Kitayama, Eds., DOI: 10.1117/12.2579104, March 2021.
BibTeX TR2020-182 PDF Video
- @inproceedings{Kojima2021mar,
- author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh K. and TaherSima, Mohammad and Parsons, Kieran},
- title = {{Application of Deep Learning for Nanophotonic Device Design}},
- booktitle = {SPIE Photonics West},
- year = 2021,
- editor = {Jalali, Bahram and Kitayama, Ken-ichi},
- month = mar,
- publisher = {SPIE},
- doi = {10.1117/12.2579104},
- url = {https://www.merl.com/publications/TR2020-182}
- }
Geng, S., Gao, P., Chatterjee, M., Hori, C., Le Roux, J., Zhang, Y., Li, H., Cherian, A., "Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers", AAAI Conference on Artificial Intelligence, February 2021, pp. 1415-1423.
BibTeX TR2021-010 PDF
- @inproceedings{Geng2021feb,
- author = {Geng, Shijie and Gao, Peng and Chatterjee, Moitreya and Hori, Chiori and {Le Roux}, Jonathan and Zhang, Yongfeng and Li, Hongsheng and Cherian, Anoop},
- title = {{Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers}},
- booktitle = {AAAI Conference on Artificial Intelligence},
- year = 2021,
- pages = {1415--1423},
- month = feb,
- publisher = {AAAI Press},
- address = {Palo Alto, California, USA},
- isbn = {978-1-57735-866-4},
- url = {https://www.merl.com/publications/TR2021-010}
- }
Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Wang, Y., Parsons, K., "Deep Neural Networks for Inverse Design of Nanophotonic Devices", IEEE Journal of Lightwave Technology, DOI: 10.1109/JLT.2021.3050083, January 2021.
BibTeX TR2021-001 PDF
- @article{Kojima2021jan,
-   title   = {{Deep Neural Networks for Inverse Design of Nanophotonic Devices}},
-   author  = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Wang, Ye and Parsons, Kieran},
-   journal = {IEEE Journal of Lightwave Technology},
-   month   = jan,
-   year    = {2021},
-   issn    = {1558-2213},
-   doi     = {10.1109/JLT.2021.3050083},
-   url     = {https://www.merl.com/publications/TR2021-001},
- }
Lohit, S., Anirudh, R., Turaga, P., "Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
BibTeX TR2021-004 PDF
- @inproceedings{Lohit2021jan,
-   title     = {{Recovering Trajectories of Unmarked Joints in 3D Human Actions Using Latent Space Optimization}},
-   author    = {Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
-   booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
-   month     = jan,
-   year      = {2021},
-   publisher = {CVF OpenAccess},
-   url       = {https://www.merl.com/publications/TR2021-004},
- }
Anirudh, R., Lohit, S., Turaga, P., "Generative Patch Priors for Practical Compressive Image Recovery", IEEE Winter Conference on Applications of Computer Vision (WACV), January 2021.
BibTeX TR2021-003 PDF
- @inproceedings{Anirudh2021jan,
-   title     = {{Generative Patch Priors for Practical Compressive Image Recovery}},
-   author    = {Anirudh, Rushil and Lohit, Suhas and Turaga, Pavan},
-   booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
-   month     = jan,
-   year      = {2021},
-   publisher = {CVF OpenAccess},
-   url       = {https://www.merl.com/publications/TR2021-003},
- }
Nowara, E., Marks, T.K., Mansour, H., Veeraraghavan, A., "Near-Infrared Imaging Photoplethysmography During Driving", IEEE Transactions on Intelligent Transportation Systems, DOI: 10.1109/TITS.2020.3038317, pp. 1-12, December 2020.
BibTeX TR2020-161 PDF
- @article{Nowara2020dec,
-   title   = {{Near-Infrared Imaging Photoplethysmography During Driving}},
-   author  = {Nowara, Ewa and Marks, Tim K. and Mansour, Hassan and Veeraraghavan, Ashok},
-   journal = {IEEE Transactions on Intelligent Transportation Systems},
-   pages   = {1--12},
-   month   = dec,
-   year    = {2020},
-   doi     = {10.1109/TITS.2020.3038317},
-   url     = {https://www.merl.com/publications/TR2020-161},
- }
Li, M., Chen, S., Zhang, Y., "Graph Cross Networks with Vertex Infomax Pooling", Advances in Neural Information Processing Systems (NeurIPS), December 2020.
BibTeX TR2020-167 PDF
- @inproceedings{Li2020dec,
-   title     = {{Graph Cross Networks with Vertex Infomax Pooling}},
-   author    = {Li, Maosen and Chen, Siheng and Zhang, Ya},
-   booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
-   month     = dec,
-   year      = {2020},
-   url       = {https://www.merl.com/publications/TR2020-167},
- }
Talreja, V., Koike-Akino, T., Wang, Y., Millar, D.S., Kojima, K., Parsons, K., "End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping", European Conference on Optical Communication (ECOC), DOI: 10.1109/ECOC48923.2020.9333382, November 2020.
BibTeX TR2020-155 PDF Video
- @inproceedings{Talreja2020nov,
-   title     = {{End-to-End Deep Learning for Phase Noise-Robust Multi-Dimensional Geometric Shaping}},
-   author    = {Talreja, Veeru and Koike-Akino, Toshiaki and Wang, Ye and Millar, David S. and Kojima, Keisuke and Parsons, Kieran},
-   booktitle = {European Conference on Optical Communication (ECOC)},
-   month     = nov,
-   year      = {2020},
-   publisher = {IEEE},
-   isbn      = {978-1-7281-7361-0},
-   doi       = {10.1109/ECOC48923.2020.9333382},
-   url       = {https://www.merl.com/publications/TR2020-155},
- }
Corcodel, R., Jain, S., van Baar, J., "Interactive Tactile Perception for Classification of Novel Object Instances", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS45743.2020.9341795, November 2020, pp. 9861-9868.
BibTeX TR2020-143 PDF Video
- @inproceedings{Corcodel2020nov,
-   title     = {{Interactive Tactile Perception for Classification of Novel Object Instances}},
-   author    = {Corcodel, Radu and Jain, Siddarth and {van Baar}, Jeroen},
-   booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
-   pages     = {9861--9868},
-   month     = nov,
-   year      = {2020},
-   publisher = {IEEE},
-   doi       = {10.1109/IROS45743.2020.9341795},
-   url       = {https://www.merl.com/publications/TR2020-143},
- }
Jones, M.J., Ramachandra, B., Vatsavai, R., "A Survey of Single-Scene Video Anomaly Detection", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2020.3040591, Vol. 44, No. 5, pp. 2293-2312, November 2020.
BibTeX TR2021-029 PDF
- @article{Jones2020nov,
-   title   = {{A Survey of Single-Scene Video Anomaly Detection}},
-   author  = {Jones, Michael J. and Ramachandra, Bharathkumar and Vatsavai, Ranga},
-   journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
-   volume  = {44},
-   number  = {5},
-   pages   = {2293--2312},
-   month   = nov,
-   year    = {2020},
-   doi     = {10.1109/TPAMI.2020.3040591},
-   url     = {https://www.merl.com/publications/TR2021-029},
- }
Ota, K., Sasaki, Y., Jha, D.K., Yoshiyasu, Y., Kanezaki, A., "Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), November 2020.
BibTeX TR2020-141 PDF Software
- @inproceedings{Ota2020nov,
- author = {Ota, Kei and Sasaki, Yoko and Jha, Devesh K. and Yoshiyasu, Yusuke and Kanezaki, Asako},
- title = {{Efficient Exploration in Constrained Environments with Goal-Oriented Reference Path}},
- booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
- year = 2020,
- month = nov,
- url = {https://www.merl.com/publications/TR2020-141}
- }
Hori, T., Moritz, N., Hori, C., Le Roux, J., "Transformer-based Long-context End-to-end Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2020-2928, October 2020, pp. 5011-5015.
BibTeX TR2020-139 PDF Presentation
- @inproceedings{Hori2020oct,
-   title     = {{Transformer-based Long-context End-to-end Speech Recognition}},
-   author    = {Hori, Takaaki and Moritz, Niko and Hori, Chiori and {Le Roux}, Jonathan},
-   booktitle = {Interspeech},
-   pages     = {5011--5015},
-   month     = oct,
-   year      = {2020},
-   issn      = {1990-9772},
-   doi       = {10.21437/Interspeech.2020-2928},
-   url       = {https://www.merl.com/publications/TR2020-139},
- }
Jayashankar, T., Le Roux, J., Moulin, P., "Detecting Audio Attacks on ASR Systems with Dropout Uncertainty", Interspeech, DOI: 10.21437/Interspeech.2020-1846, October 2020, pp. 4671-4675.
BibTeX TR2020-137 PDF Presentation
- @inproceedings{Jayashankar2020oct,
-   title     = {{Detecting Audio Attacks on ASR Systems with Dropout Uncertainty}},
-   author    = {Jayashankar, Tejas and {Le Roux}, Jonathan and Moulin, Pierre},
-   booktitle = {Interspeech},
-   pages     = {4671--4675},
-   month     = oct,
-   year      = {2020},
-   issn      = {1990-9772},
-   doi       = {10.21437/Interspeech.2020-1846},
-   url       = {https://www.merl.com/publications/TR2020-137},
- }
Moritz, N., Wichern, G., Hori, T., Le Roux, J., "All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection", Interspeech, DOI: 10.21437/Interspeech.2020-2757, October 2020, pp. 3112-3116.
BibTeX TR2020-138 PDF Presentation
- @inproceedings{Moritz2020oct,
-   title     = {{All-in-One Transformer: Unifying Speech Recognition, Audio Tagging, and Event Detection}},
-   author    = {Moritz, Niko and Wichern, Gordon and Hori, Takaaki and {Le Roux}, Jonathan},
-   booktitle = {Interspeech},
-   pages     = {3112--3116},
-   month     = oct,
-   year      = {2020},
-   issn      = {1990-9772},
-   doi       = {10.21437/Interspeech.2020-2757},
-   url       = {https://www.merl.com/publications/TR2020-138},
- }
Manilow, E., Wichern, G., Le Roux, J., "Hierarchical Musical Instrument Separation", International Society for Music Information Retrieval (ISMIR) Conference, October 2020, pp. 376-383.
BibTeX TR2020-136 PDF Software
- @inproceedings{Manilow2020oct,
-   title     = {{Hierarchical Musical Instrument Separation}},
-   author    = {Manilow, Ethan and Wichern, Gordon and {Le Roux}, Jonathan},
-   booktitle = {International Society for Music Information Retrieval (ISMIR) Conference},
-   pages     = {376--383},
-   month     = oct,
-   year      = {2020},
-   isbn      = {978-0-9813537-0-8},
-   url       = {https://www.merl.com/publications/TR2020-136},
- }
Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D.K., Parsons, K., Qi, M., "Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices", Laser & Photonics Reviews, DOI: 10.1002/lpor.202000287, Vol. 14, pp. 2000287, October 2020.
BibTeX TR2020-135 PDF
- @article{Tang2020oct,
- author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh K. and Parsons, Kieran and Qi, Minghao},
- title = {{Generative Deep Learning Model for Inverse Design of Integrated Nanophotonic Devices}},
- journal = {Laser \& Photonics Reviews},
- year = 2020,
- volume = 14,
- pages = {2000287},
- month = oct,
- doi = {10.1002/lpor.202000287},
- url = {https://www.merl.com/publications/TR2020-135}
- }
Seetharaman, P., Wichern, G., Pardo, B., Le Roux, J., "Autoclip: Adaptive Gradient Clipping For Source Separation Networks", IEEE International Workshop on Machine Learning for Signal Processing (MLSP), DOI: 10.1109/MLSP49062.2020.9231926, September 2020.
BibTeX TR2020-132 PDF
- @inproceedings{Seetharaman2020sep,
-   title     = {{Autoclip: Adaptive Gradient Clipping For Source Separation Networks}},
-   author    = {Seetharaman, Prem and Wichern, Gordon and Pardo, Bryan and {Le Roux}, Jonathan},
-   booktitle = {IEEE International Workshop on Machine Learning for Signal Processing (MLSP)},
-   month     = sep,
-   year      = {2020},
-   publisher = {IEEE},
-   doi       = {10.1109/MLSP49062.2020.9231926},
-   url       = {https://www.merl.com/publications/TR2020-132},
- }
Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D.K., Parsons, K., TaherSima, M., Sang, F., Klamkin, J., Qi, M., "Inverse Design of Nanophotonic Devices using Deep Neural Networks", Asia Communications and Photonics Conference (ACP), September 2020, pp. Su1A.1.
BibTeX TR2020-130 PDF Video
- @inproceedings{Kojima2020sep,
-   title     = {{Inverse Design of Nanophotonic Devices using Deep Neural Networks}},
-   author    = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh K. and Parsons, Kieran and TaherSima, Mohammad and Sang, Fengqiao and Klamkin, Jonathan and Qi, Minghao},
-   booktitle = {Asia Communications and Photonics Conference (ACP)},
-   pages     = {Su1A.1},
-   month     = sep,
-   year      = {2020},
-   publisher = {Optical Society of America},
-   isbn      = {978-1-943580-82-8},
-   url       = {https://www.merl.com/publications/TR2020-130},
- }
Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Autoencoder for Subject-Invariant Physiological Feature Extraction", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2020.3020215, Vol. 27, pp. 1565-1569, September 2020.
BibTeX TR2020-128 PDF
- @article{Han2020sep,
-   title   = {{Disentangled Adversarial Autoencoder for Subject-Invariant Physiological Feature Extraction}},
-   author  = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
-   journal = {IEEE Signal Processing Letters},
-   volume  = {27},
-   pages   = {1565--1569},
-   month   = sep,
-   year    = {2020},
-   issn    = {1558-2361},
-   doi     = {10.1109/LSP.2020.3020215},
-   url     = {https://www.merl.com/publications/TR2020-128},
- }
Pishdadian, F., Wichern, G., Le Roux, J., "Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2020.3013105, Vol. 28, pp. 2386-2399, September 2020.
BibTeX TR2020-126 PDF
- @article{Pishdadian2020sep,
-   title   = {{Finding Strength in Weakness: Learning to Separate Sounds with Weak Supervision}},
-   author  = {Pishdadian, Fatemeh and Wichern, Gordon and {Le Roux}, Jonathan},
-   journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
-   volume  = {28},
-   pages   = {2386--2399},
-   month   = sep,
-   year    = {2020},
-   doi     = {10.1109/TASLP.2020.3013105},
-   url     = {https://www.merl.com/publications/TR2020-126},
- }
Cherian, A., Chatterjee, M., Ahuja, N., "Sound2Sight: Generating Visual Dynamics from Sound and Context", European Conference on Computer Vision (ECCV), Vedaldi, A., Bischof, H., Brox, Th., Frahm, J.-M., Eds., August 2020.
BibTeX TR2020-121 PDF Software
- @inproceedings{Cherian2020aug,
-   title     = {{Sound2Sight: Generating Visual Dynamics from Sound and Context}},
-   author    = {Cherian, Anoop and Chatterjee, Moitreya and Ahuja, Narendra},
-   editor    = {Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M.},
-   booktitle = {European Conference on Computer Vision (ECCV)},
-   month     = aug,
-   year      = {2020},
-   publisher = {Springer},
-   url       = {https://www.merl.com/publications/TR2020-121},
- }
Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Transfer Learning for Physiological Biosignals", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/EMBC44109.2020.9175233, July 2020.
BibTeX TR2020-109 PDF Video Presentation
- @inproceedings{Han2020jul,
-   title     = {{Disentangled Adversarial Transfer Learning for Physiological Biosignals}},
-   author    = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
-   booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
-   month     = jul,
-   year      = {2020},
-   publisher = {IEEE},
-   issn      = {1558-4615},
-   isbn      = {978-1-7281-1990-8},
-   doi       = {10.1109/EMBC44109.2020.9175233},
-   url       = {https://www.merl.com/publications/TR2020-109},
- }