Publications

Wang, X., Kim, K.J., Wang, Y., Koike-Akino, T., Parsons, K., "DeepEAD: Explainable Anomaly Detection from System Logs", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC45041.2023.10279563, May 2023.
BibTeX TR2023-050 PDF
- @inproceedings{Wang2023may,
- author = {Wang, Xinda and Kim, Kyeong Jin and Wang, Ye and Koike-Akino, Toshiaki and Parsons, Kieran},
- title = {{DeepEAD: Explainable Anomaly Detection from System Logs}},
- booktitle = {IEEE International Conference on Communications (ICC)},
- year = 2023,
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICC45041.2023.10279563},
- issn = {1938-1883},
- isbn = {978-1-5386-7462-8},
- url = {https://www.merl.com/publications/TR2023-050}
- }
Kim, K.J., Vinod, A.P., Guo, J., Deshpande, V.M., Parsons, K., "Spectrum Sharing-inspired Safe Motion Planning", IEEE International Conference on Communications Workshops (ICC), May 2023.
BibTeX TR2023-049 PDF
- @inproceedings{Kim2023may2,
- author = {Kim, Kyeong Jin and Vinod, Abraham P. and Guo, Jianlin and Deshpande, Vedang M. and Parsons, Kieran},
- title = {{Spectrum Sharing-inspired Safe Motion Planning}},
- booktitle = {IEEE International Conference on Communications Workshops (ICC)},
- year = 2023,
- month = may,
- url = {https://www.merl.com/publications/TR2023-049}
- }
Xu, Y., Wang, B., Sakamoto, Y., Yamamoto, T., Nishimura, Y., "Comparison of Learning-based Surrogate Models for Electric Motors", Conference on the Computation of Electromagnetic Fields (COMPUMAG), DOI: 10.1109/COMPUMAG56388.2023.10411811, May 2023, pp. 1-4.
BibTeX TR2023-042 PDF
- @inproceedings{Xu2023may,
- author = {Xu, Yihao and Wang, Bingnan and Sakamoto, Yusuke and Yamamoto, Tatsuya and Nishimura, Yuki},
- title = {{Comparison of Learning-based Surrogate Models for Electric Motors}},
- booktitle = {2023 24th International Conference on the Computation of Electromagnetic Fields (COMPUMAG)},
- year = 2023,
- pages = {1--4},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/COMPUMAG56388.2023.10411811},
- url = {https://www.merl.com/publications/TR2023-042}
- }
Chen, K., Wichern, G., Germain, F., Le Roux, J., "Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT", IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB), DOI: 10.1109/ICASSPW59220.2023.10193575, May 2023.
BibTeX TR2023-030 PDF
- @inproceedings{Chen2023may,
- author = {Chen, Ke and Wichern, Gordon and Germain, Francois and {Le Roux}, Jonathan},
- title = {{Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT}},
- booktitle = {IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB)},
- year = 2023,
- month = may,
- doi = {10.1109/ICASSPW59220.2023.10193575},
- isbn = {979-8-3503-0261-5},
- url = {https://www.merl.com/publications/TR2023-030}
- }
Aralikatti, R., Boeddeker, C., Wichern, G., Subramanian, A.S., Le Roux, J., "Reverberation as Supervision for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095022, May 2023, pp. 1-5.
BibTeX TR2023-016 PDF
- @inproceedings{Aralikatti2023may,
- author = {Aralikatti, Rohith and Boeddeker, Christoph and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
- title = {{Reverberation as Supervision for Speech Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10095022},
- url = {https://www.merl.com/publications/TR2023-016}
- }
Berk, A., Ma, Y., Boufounos, P.T., Wang, P., Mansour, H., "Deep Proximal Gradient Method for Learned Convex Regularizers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10094632, May 2023, pp. 1-5.
BibTeX TR2023-032 PDF Video
- @inproceedings{Berk2023may,
- author = {Berk, Aaron and Ma, Yanting and Boufounos, Petros T. and Wang, Pu and Mansour, Hassan},
- title = {{Deep Proximal Gradient Method for Learned Convex Regularizers}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10094632},
- isbn = {978-1-7281-6327-7},
- url = {https://www.merl.com/publications/TR2023-032}
- }
Bralios, D., Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Latent Iterative Refinement for Modular Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10096897, May 2023, pp. 1-5.
BibTeX TR2023-019 PDF
- @inproceedings{Bralios2023may,
- author = {Bralios, Dimitrios and Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and {Le Roux}, Jonathan},
- title = {{Latent Iterative Refinement for Modular Source Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10096897},
- url = {https://www.merl.com/publications/TR2023-019}
- }
Fujihashi, T., Koike-Akino, T., Watanabe, T., "Soft 2D-to-3D Delivery Using Deep Graph Neural Networks for Holographic-Type Communication", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095882, May 2023.
BibTeX TR2023-031 PDF
- @inproceedings{Fujihashi2023may,
- author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi},
- title = {{Soft 2D-to-3D Delivery Using Deep Graph Neural Networks for Holographic-Type Communication}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10095882},
- isbn = {978-1-7281-6327-7},
- url = {https://www.merl.com/publications/TR2023-031}
- }
Petermann, D., Wichern, G., Subramanian, A.S., Le Roux, J., "Hyperbolic Audio Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10094943, May 2023, pp. 1-5.
BibTeX TR2023-017 PDF Video Software
- @inproceedings{Petermann2023may,
- author = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
- title = {{Hyperbolic Audio Source Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10094943},
- url = {https://www.merl.com/publications/TR2023-017}
- }
Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Optimal Condition Training for Target Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095128, May 2023, pp. 1-5.
BibTeX TR2023-018 PDF
- @inproceedings{Tzinis2023may,
- author = {Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and {Le Roux}, Jonathan},
- title = {{Optimal Condition Training for Target Source Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10095128},
- url = {https://www.merl.com/publications/TR2023-018}
- }
Vaca-Rubio, C., Wang, P., Koike-Akino, T., Wang, Y., Boufounos, P.T., Popovski, P., "mmWave Wi-Fi Trajectory Estimation with Continuous-Time Neural Dynamic Learning", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10096474, May 2023, pp. 1-5.
BibTeX TR2023-033 PDF Video
- @inproceedings{Vaca-Rubio2023may,
- author = {Vaca-Rubio, Cristian and Wang, Pu and Koike-Akino, Toshiaki and Wang, Ye and Boufounos, Petros T. and Popovski, Petar},
- title = {{mmWave Wi-Fi Trajectory Estimation with Continuous-Time Neural Dynamic Learning}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10096474},
- isbn = {978-1-7281-6327-7},
- url = {https://www.merl.com/publications/TR2023-033}
- }
Yen, H., Germain, F., Wichern, G., Le Roux, J., "Cold Diffusion for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10096064, May 2023, pp. 1-5.
BibTeX TR2023-020 PDF
- @inproceedings{Yen2023may,
- author = {Yen, Hao and Germain, Francois and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Cold Diffusion for Speech Enhancement}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10096064},
- url = {https://www.merl.com/publications/TR2023-020}
- }
Zhao, Q., Ma, Y., Boufounos, P.T., Nabi, S., Mansour, H., "Deep Born Operator Learning for Reflection Tomographic Imaging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49357.2023.10095494, May 2023, pp. 1-5.
BibTeX TR2023-029 PDF Video
- @inproceedings{Zhao2023may,
- author = {Zhao, Qingqing and Ma, Yanting and Boufounos, Petros T. and Nabi, Saleh and Mansour, Hassan},
- title = {{Deep Born Operator Learning for Reflection Tomographic Imaging}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2023,
- pages = {1--5},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP49357.2023.10095494},
- url = {https://www.merl.com/publications/TR2023-029}
- }
Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
BibTeX TR2023-014 PDF Video Data Software Presentation
- @inproceedings{Cherian2023mar,
- author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
- title = {{Are Deep Neural Networks SMARTer than Second Graders?}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2023,
- pages = {10834--10844},
- month = mar,
- publisher = {CVF},
- url = {https://www.merl.com/publications/TR2023-014}
- }
Yoshino, K., Chen, Y.-N., Crook, P., Kottur, S., Li, J., Hedayatnia, B., Moon, S., Fei, Z., Li, Z., Zhang, J., Feng, Y., Zhou, J., Kim, S., Liu, Y., Jin, D., Papangelis, A., Gopalakrishnan, K., Hakkani-Tur, D., Damavandi, B., Geramifard, A., Hori, C., Shah, A., Zhang, C., Li, H., Sedoc, J., D'Haro, L.F., Banchs, R., Rudnicky, A., "Overview of the Tenth Dialog System Technology Challenge: DSTC10", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TCSVT.2002.808437, Vol. 13, No. 2, pp. 121-130, February 2023.
BibTeX TR2023-109 PDF
- @article{Yoshino2023feb,
- author = {Yoshino, Koichiro and Chen, Yun-Nung and Crook, Paul and Kottur, Satwik and Li, Jinchao and Hedayatnia, Behnam and Moon, Seungwhan and Fei, Zhengcong and Li, Zekang and Zhang, Jinchao and Feng, Yang and Zhou, Jie and Kim, Seokhwan and Liu, Yang and Jin, Di and Papangelis, Alexandros and Gopalakrishnan, Karthik and Hakkani-Tur, Dilek and Damavandi, Babak and Geramifard, Alborz and Hori, Chiori and Shah, Ankit and Zhang, Chen and Li, Haizhou and Sedoc, Jo{\~a}o and D'Haro, Luis F. and Banchs, Rafael and Rudnicky, Alexander},
- title = {{Overview of the Tenth Dialog System Technology Challenge: DSTC10}},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2023,
- volume = 13,
- number = 2,
- pages = {121--130},
- month = feb,
- doi = {10.1109/TCSVT.2002.808437},
- url = {https://www.merl.com/publications/TR2023-109}
- }
Kojima, K., Koike-Akino, T., Wang, Y., Jung, M., Brand, M., "Inverse design of two-dimensional freeform metagrating using an adversarial conditional variational autoencoder", SPIE Photonics West, DOI: 10.1117/12.2650299, January 2023.
BibTeX TR2023-004 PDF
- @inproceedings{Kojima2023jan,
- author = {Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Jung, Minwoo and Brand, Matthew},
- title = {{Inverse design of two-dimensional freeform metagrating using an adversarial conditional variational autoencoder}},
- booktitle = {Proc. SPIE 12431, Photonic and Phononic Properties of Engineered Nanostructures XIII},
- year = 2023,
- month = jan,
- publisher = {SPIE},
- doi = {10.1117/12.2650299},
- url = {https://www.merl.com/publications/TR2023-004}
- }
Liu, T., Cherian, A., "Learning a Constrained Optimizer: A Primal Method", AAAI Bridge on Constraint Programming and Machine Learning, January 2023.
BibTeX TR2023-003 PDF
- @inproceedings{Liu2023jan,
- author = {Liu, Tao and Cherian, Anoop},
- title = {{Learning a Constrained Optimizer: A Primal Method}},
- booktitle = {AAAI Bridge on Constraint Programming and Machine Learning},
- year = 2023,
- month = jan,
- url = {https://www.merl.com/publications/TR2023-003}
- }
Tohme, T., Liu, D., Youcef-Toumi, K., "GSR: A Generalized Symbolic Regression Approach", Transactions on Machine Learning Research, January 2023.
BibTeX TR2023-002 PDF
- @article{Tohme2023jan,
- author = {Tohme, Tony and Liu, Dehong and Youcef-Toumi, Kamal},
- title = {{GSR: A Generalized Symbolic Regression Approach}},
- journal = {Transactions on Machine Learning Research},
- year = 2023,
- month = jan,
- issn = {2835-8856},
- url = {https://www.merl.com/publications/TR2023-002}
- }
Wang, Z.-Q., Wichern, G., Watanabe, S., Le Roux, J., "STFT-Domain Neural Speech Enhancement with Very Low Algorithmic Latency", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2022.3224285, Vol. 31, pp. 397-410, December 2022.
BibTeX TR2022-166 PDF
- @article{Wang2022dec2,
- author = {Wang, Zhong-Qiu and Wichern, Gordon and Watanabe, Shinji and {Le Roux}, Jonathan},
- title = {{STFT-Domain Neural Speech Enhancement with Very Low Algorithmic Latency}},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2022,
- volume = 31,
- pages = {397--410},
- month = dec,
- doi = {10.1109/TASLP.2022.3224285},
- issn = {2329-9304},
- url = {https://www.merl.com/publications/TR2022-166}
- }
Singla, V., Aeron, S., Koike-Akino, T., Parsons, K., Brand, M., Wang, Y., "Learning with noisy labels using low-dimensional model trajectory", NeurIPS 2022 Workshop on Distribution Shifts (DistShift), December 2022.
BibTeX TR2022-156 PDF
- @inproceedings{Singla2022dec,
- author = {Singla, Vasu and Aeron, Shuchin and Koike-Akino, Toshiaki and Parsons, Kieran and Brand, Matthew and Wang, Ye},
- title = {{Learning with noisy labels using low-dimensional model trajectory}},
- booktitle = {NeurIPS 2022 Workshop on Distribution Shifts: Connecting Methods and Applications},
- year = 2022,
- month = dec,
- publisher = {OpenReview},
- url = {https://www.merl.com/publications/TR2022-156}
- }
Shimoya, R., Morimoto, T., van Baar, J., Boufounos, P.T., Ma, Y., Mansour, H., "Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images", IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), DOI: 10.1109/AVSS56176.2022.9959354, November 2022, pp. 1-8.
BibTeX TR2022-149 PDF
- @inproceedings{Shimoya2022nov,
- author = {Shimoya, Ryosuke and Morimoto, Tahashi and {van Baar}, Jeroen and Boufounos, Petros T. and Ma, Yanting and Mansour, Hassan},
- title = {{Learning Occlusion-Aware Dense Correspondences for Multi-Modal Images}},
- booktitle = {IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS)},
- year = 2022,
- pages = {1--8},
- month = nov,
- doi = {10.1109/AVSS56176.2022.9959354},
- isbn = {978-1-6654-6382-9},
- url = {https://www.merl.com/publications/TR2022-149}
- }
Romero, D., Lohit, S., "Learning Partial Equivariances from Data", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 36466-36478.
BibTeX TR2022-148 PDF Software Presentation
- @inproceedings{Romero2022nov,
- author = {Romero, David and Lohit, Suhas},
- title = {{Learning Partial Equivariances from Data}},
- booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
- year = 2022,
- editor = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
- pages = {36466--36478},
- month = nov,
- url = {https://www.merl.com/publications/TR2022-148}
- }
Wang, H., Lohit, S., Jones, M.J., Fu, R., "What Makes a “Good” Data Augmentation in Knowledge Distillation – A Statistical Perspective", Advances in Neural Information Processing Systems (NeurIPS), S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh, Eds., November 2022, pp. 13456-13469.
BibTeX TR2022-147 PDF
- @inproceedings{Wang2022nov,
- author = {Wang, Huan and Lohit, Suhas and Jones, Michael J. and Fu, Raymond},
- title = {{What Makes a ``Good'' Data Augmentation in Knowledge Distillation -- A Statistical Perspective}},
- booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
- year = 2022,
- editor = {S. Koyejo and S. Mohamed and A. Agarwal and D. Belgrave and K. Cho and A. Oh},
- pages = {13456--13469},
- month = nov,
- url = {https://www.merl.com/publications/TR2022-147}
- }
Venkatesh, S., Wichern, G., Subramanian, A.S., Le Roux, J., "Improved Domain Generalization via Disentangled Multi-Task Learning in Unsupervised Anomalous Sound Detection", DCASE Workshop, Lagrange, M. and Mesaros, A. and Pellegrini, T. and Richard, G. and Serizel, R. and Stowell, D., Eds., November 2022.
BibTeX TR2022-146 PDF Presentation
- @inproceedings{Venkatesh2022nov,
- author = {Venkatesh, Satvik and Wichern, Gordon and Subramanian, Aswin Shanmugam and {Le Roux}, Jonathan},
- title = {{Improved Domain Generalization via Disentangled Multi-Task Learning in Unsupervised Anomalous Sound Detection}},
- booktitle = {DCASE Workshop},
- year = 2022,
- editor = {Lagrange, M. and Mesaros, A. and Pellegrini, T. and Richard, G. and Serizel, R. and Stowell, D.},
- month = nov,
- isbn = {978-952-03-2677-7},
- url = {https://www.merl.com/publications/TR2022-146}
- }
Yu, X., Smedemark-Margulies, N., Aeron, S., Koike-Akino, T., Moulin, P., Brand, M., Parsons, K., Wang, Y., "Improving Adversarial Robustness by Learning Shared Information", Pattern Recognition, DOI: 10.1016/j.patcog.2022.109054, Vol. 134, pp. 109054, November 2022.
BibTeX TR2022-141 PDF
- @article{Yu2022nov,
- author = {Yu, Xi and Smedemark-Margulies, Niklas and Aeron, Shuchin and Koike-Akino, Toshiaki and Moulin, Pierre and Brand, Matthew and Parsons, Kieran and Wang, Ye},
- title = {{Improving Adversarial Robustness by Learning Shared Information}},
- journal = {Pattern Recognition},
- year = 2022,
- volume = 134,
- pages = 109054,
- month = nov,
- doi = {10.1016/j.patcog.2022.109054},
- issn = {0031-3203},
- url = {https://www.merl.com/publications/TR2022-141}
- }