Publications

224 / 3,734 publications found.


  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", arXiv, October 2024.
    BibTeX arXiv
    • @article{Saijo2024oct,
    • author        = {Saijo, Kohei and Ebbers, Janek and Germain, François G and Wichern, Gordon and Le Roux, Jonathan},
    • title         = {Task-Aware Unified Source Separation},
    • journal       = {arXiv},
    • month         = oct,
    • year          = {2024},
    • eprint        = {2410.23987},
    • archivePrefix = {arXiv},
    • url           = {https://arxiv.org/abs/2410.23987v1},
    • }
  •  Cornell, S., Ebbers, J., Douwes, C., Martin-Morato, I., Harju, M., Mesaros, A., Serizel, R., "DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels", Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop, October 2024.
    BibTeX TR2024-146 PDF
    • @inproceedings{Cornell2024oct,
    • author    = {Cornell, Samuele and Ebbers, Janek and Douwes, Constance and Martin-Morato, Irene and Harju, Manu and Mesaros, Annamaria and Serizel, Romain},
    • title     = {{DCASE} 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels},
    • booktitle = {Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop},
    • month     = oct,
    • year      = {2024},
    • url       = {https://www.merl.com/publications/TR2024-146},
    • }
  •  Saijo, K., Wichern, G., Germain, F.G., Pan, Z., Le Roux, J., "TF-Locoformer: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement", International Workshop on Acoustic Signal Enhancement (IWAENC), September 2024.
    BibTeX TR2024-126 PDF Software
    • @inproceedings{Saijo2024sep2,
    • author    = {Saijo, Kohei and Wichern, Gordon and Germain, François G and Pan, Zexu and Le Roux, Jonathan},
    • title     = {{TF-Locoformer}: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement},
    • booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
    • month     = sep,
    • year      = {2024},
    • url       = {https://www.merl.com/publications/TR2024-126},
    • }
  •  Pan, Z., Wichern, G., Germain, F.G., Saijo, K., Le Roux, J., "PARIS: Pseudo-AutoRegressIve Siamese Training for Online Speech Separation", Interspeech, DOI: 10.21437/​Interspeech.2024-1066, September 2024, pp. 582-586.
    BibTeX TR2024-124 PDF
    • @inproceedings{Pan2024sep,
    • author    = {Pan, Zexu and Wichern, Gordon and Germain, François G and Saijo, Kohei and Le Roux, Jonathan},
    • title     = {{PARIS}: {Pseudo-AutoRegressIve} {Siamese} Training for Online Speech Separation},
    • booktitle = {Interspeech},
    • pages     = {582--586},
    • month     = sep,
    • year      = {2024},
    • doi       = {10.21437/Interspeech.2024-1066},
    • issn      = {2958-1796},
    • url       = {https://www.merl.com/publications/TR2024-124},
    • }
  •  Saijo, K., Wichern, G., Germain, F.G., Pan, Z., Le Roux, J., "Enhanced Reverberation as Supervision for Unsupervised Speech Separation", Interspeech, DOI: 10.21437/​Interspeech.2024-1241, September 2024, pp. 607-611.
    BibTeX TR2024-116 PDF Software
    • @inproceedings{Saijo2024sep,
    • author    = {Saijo, Kohei and Wichern, Gordon and Germain, François G and Pan, Zexu and Le Roux, Jonathan},
    • title     = {Enhanced Reverberation as Supervision for Unsupervised Speech Separation},
    • booktitle = {Interspeech},
    • pages     = {607--611},
    • month     = sep,
    • year      = {2024},
    • doi       = {10.21437/Interspeech.2024-1241},
    • issn      = {2958-1796},
    • url       = {https://www.merl.com/publications/TR2024-116},
    • }
  •  Vinod, A.P., Yamazaki, S., Chakrabarty, A., Yoshikawa, N., Di Cairano, S., "Aircraft Approach Management using Reachability and Dynamic Programming", American Control Conference (ACC), DOI: 10.23919/​ACC60939.2024.10644902, June 2024, pp. 318-324.
    BibTeX TR2024-079 PDF
    • @inproceedings{Vinod2024jun,
    • author    = {Vinod, Abraham P. and Yamazaki, Sachiyo and Chakrabarty, Ankush and Yoshikawa, Nobuyuki and Di Cairano, Stefano},
    • title     = {Aircraft Approach Management using Reachability and Dynamic Programming},
    • booktitle = {American Control Conference (ACC)},
    • pages     = {318--324},
    • month     = jun,
    • year      = {2024},
    • publisher = {IEEE},
    • doi       = {10.23919/ACC60939.2024.10644902},
    • url       = {https://www.merl.com/publications/TR2024-079},
    • }
  •  Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Why does music source separation benefit from cacophony?", IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA), DOI: 10.1109/​ICASSPW62465.2024.10669899, March 2024, pp. 873-877.
    BibTeX TR2024-030 PDF Video
    • @inproceedings{Jeon2024mar,
    • author    = {Jeon, Chang-Bin and Wichern, Gordon and Germain, François G and Le Roux, Jonathan},
    • title     = {Why does music source separation benefit from cacophony?},
    • booktitle = {IEEE ICASSP Satellite Workshop on Explainable Machine Learning for Speech and Audio (XAI-SA)},
    • pages     = {873--877},
    • month     = mar,
    • year      = {2024},
    • publisher = {IEEE},
    • doi       = {10.1109/ICASSPW62465.2024.10669899},
    • isbn      = {979-8-3503-7451-3},
    • url       = {https://www.merl.com/publications/TR2024-030},
    • }
  •  Boeddeker, C., Subramanian, A.S., Wichern, G., Haeb-Umbach, R., Le Roux, J., "TS-SEP: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2024.3350887, Vol. 32, pp. 1185-1197, February 2024.
    BibTeX TR2024-006 PDF Software
    • @article{Boeddeker2024feb,
    • author  = {Boeddeker, Christoph and Subramanian, Aswin Shanmugam and Wichern, Gordon and Haeb-Umbach, Reinhold and Le Roux, Jonathan},
    • title   = {{TS-SEP}: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • volume  = {32},
    • pages   = {1185--1197},
    • month   = feb,
    • year    = {2024},
    • doi     = {10.1109/TASLP.2024.3350887},
    • issn    = {2329-9304},
    • url     = {https://www.merl.com/publications/TR2024-006},
    • }
  •  Pan, Z., Wichern, G., Masuyama, Y., Germain, F.G., Khurana, S., Hori, C., Le Roux, J., "Scenario-Aware Audio-Visual TF-GridNet for Target Speech Extraction", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/​ASRU57964.2023.10389618, December 2023.
    BibTeX TR2023-152 PDF Video
    • @inproceedings{Pan2023dec2,
    • author    = {Pan, Zexu and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G and Khurana, Sameer and Hori, Chiori and Le Roux, Jonathan},
    • title     = {Scenario-Aware Audio-Visual {TF-GridNet} for Target Speech Extraction},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • month     = dec,
    • year      = {2023},
    • doi       = {10.1109/ASRU57964.2023.10389618},
    • isbn      = {979-8-3503-0689-7},
    • url       = {https://www.merl.com/publications/TR2023-152},
    • }
  •  Falcon Perez, R., Wichern, G., Germain, F., Le Roux, J., "Location as supervision for weakly supervised multi-channel source separation of machine sounds", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/​WASPAA58266.2023.10248128, September 2023.
    BibTeX TR2023-119 PDF Presentation
    • @inproceedings{FalconPerez2023aug,
    • author    = {Falcon Perez, Ricardo and Wichern, Gordon and Germain, Francois and Le Roux, Jonathan},
    • title     = {Location as supervision for weakly supervised multi-channel source separation of machine sounds},
    • booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
    • month     = sep,
    • year      = {2023},
    • publisher = {IEEE},
    • doi       = {10.1109/WASPAA58266.2023.10248128},
    • issn      = {1947-1629},
    • isbn      = {979-8-3503-2372-6},
    • url       = {https://www.merl.com/publications/TR2023-119},
    • }
  •  Petermann, D., Wichern, G., Subramanian, A.S., Wang, Z.-Q., Le Roux, J., "Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/​TASLP.2023.3290428, Vol. 31, pp. 2592-2605, September 2023.
    BibTeX TR2023-113 PDF
    • @article{Petermann2023sep,
    • author  = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Wang, Zhong-Qiu and Le Roux, Jonathan},
    • title   = {Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks},
    • journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
    • volume  = {31},
    • pages   = {2592--2605},
    • month   = sep,
    • year    = {2023},
    • doi     = {10.1109/TASLP.2023.3290428},
    • issn    = {2329-9304},
    • url     = {https://www.merl.com/publications/TR2023-113},
    • }
  •  Vinod, A.P., Di Cairano, S., "Sample quantile-based programming for non-convex separable chance constraints", American Control Conference (ACC), May 2023, pp. 1517-1522.
    BibTeX TR2023-062 PDF
    • @inproceedings{Vinod2023may,
    • author    = {Vinod, Abraham P. and Di Cairano, Stefano},
    • title     = {Sample quantile-based programming for non-convex separable chance constraints},
    • booktitle = {American Control Conference (ACC)},
    • pages     = {1517--1522},
    • month     = may,
    • year      = {2023},
    • url       = {https://www.merl.com/publications/TR2023-062},
    • }
  •  Chen, K., Wichern, G., Germain, F., Le Roux, J., "Pac-HuBERT: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit BERT", IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB), DOI: 10.1109/​ICASSPW59220.2023.10193575, May 2023.
    BibTeX TR2023-030 PDF
    • @inproceedings{Chen2023may,
    • author    = {Chen, Ke and Wichern, Gordon and Germain, Francois and Le Roux, Jonathan},
    • title     = {{Pac-HuBERT}: Self-Supervised Music Source Separation via Primitive Auditory Clustering and Hidden-Unit {BERT}},
    • booktitle = {IEEE ICASSP Satellite Workshop on Self-supervision in Audio, Speech and Beyond (SASB)},
    • month     = may,
    • year      = {2023},
    • doi       = {10.1109/ICASSPW59220.2023.10193575},
    • isbn      = {979-8-3503-0261-5},
    • url       = {https://www.merl.com/publications/TR2023-030},
    • }
  •  Aralikatti, R., Boeddeker, C., Wichern, G., Subramanian, A.S., Le Roux, J., "Reverberation as Supervision for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095022, May 2023, pp. 1-5.
    BibTeX TR2023-016 PDF
    • @inproceedings{Aralikatti2023may,
    • author    = {Aralikatti, Rohith and Boeddeker, Christoph and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
    • title     = {Reverberation as Supervision for Speech Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • pages     = {1--5},
    • month     = may,
    • year      = {2023},
    • publisher = {IEEE},
    • doi       = {10.1109/ICASSP49357.2023.10095022},
    • url       = {https://www.merl.com/publications/TR2023-016},
    • }
  •  Bralios, D., Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Latent Iterative Refinement for Modular Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096897, May 2023, pp. 1-5.
    BibTeX TR2023-019 PDF
    • @inproceedings{Bralios2023may,
    • author    = {Bralios, Dimitrios and Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and Le Roux, Jonathan},
    • title     = {Latent Iterative Refinement for Modular Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • pages     = {1--5},
    • month     = may,
    • year      = {2023},
    • publisher = {IEEE},
    • doi       = {10.1109/ICASSP49357.2023.10096897},
    • url       = {https://www.merl.com/publications/TR2023-019},
    • }
  •  Petermann, D., Wichern, G., Subramanian, A.S., Le Roux, J., "Hyperbolic Audio Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10094943, May 2023, pp. 1-5.
    BibTeX TR2023-017 PDF Video Software
    • @inproceedings{Petermann2023may,
    • author    = {Petermann, Darius and Wichern, Gordon and Subramanian, Aswin Shanmugam and Le Roux, Jonathan},
    • title     = {Hyperbolic Audio Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • pages     = {1--5},
    • month     = may,
    • year      = {2023},
    • publisher = {IEEE},
    • doi       = {10.1109/ICASSP49357.2023.10094943},
    • url       = {https://www.merl.com/publications/TR2023-017},
    • }
  •  Tzinis, E., Wichern, G., Smaragdis, P., Le Roux, J., "Optimal Condition Training for Target Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10095128, May 2023, pp. 1-5.
    BibTeX TR2023-018 PDF
    • @inproceedings{Tzinis2023may,
    • author    = {Tzinis, Efthymios and Wichern, Gordon and Smaragdis, Paris and Le Roux, Jonathan},
    • title     = {Optimal Condition Training for Target Source Separation},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • pages     = {1--5},
    • month     = may,
    • year      = {2023},
    • publisher = {IEEE},
    • doi       = {10.1109/ICASSP49357.2023.10095128},
    • url       = {https://www.merl.com/publications/TR2023-018},
    • }
  •  Lin, C., "Analytical Parametrization for Magnetization of Gadolinium based on Scaling Hypothesis", Physica A, DOI: 10.1016/​j.physa.2023.128686, Vol. 617, pp. 128686, April 2023.
    BibTeX TR2023-015 PDF
    • @article{Lin2023apr,
    • author  = {Lin, Chungwei},
    • title   = {Analytical Parametrization for Magnetization of Gadolinium based on Scaling Hypothesis},
    • journal = {Physica A},
    • volume  = {617},
    • pages   = {128686},
    • month   = apr,
    • year    = {2023},
    • doi     = {10.1016/j.physa.2023.128686},
    • issn    = {0378-4371},
    • url     = {https://www.merl.com/publications/TR2023-015},
    • }
  •  Chatterjee, M., Ahuja, N., Cherian, A., "Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation", Advances in Neural Information Processing Systems (NeurIPS), November 2022.
    BibTeX TR2022-140 PDF Presentation
    • @inproceedings{Chatterjee2022nov,
    • author    = {Chatterjee, Moitreya and Ahuja, Narendra and Cherian, Anoop},
    • title     = {Learning Audio-Visual Dynamics Using Scene Graphs for Audio Source Separation},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • month     = nov,
    • year      = {2022},
    • url       = {https://www.merl.com/publications/TR2022-140},
    • }
  •  Tzinis, E., Wichern, G., Subramanian, A.S., Smaragdis, P., Le Roux, J., "Heterogeneous Target Speech Separation", Interspeech, DOI: 10.21437/​Interspeech.2022-10717, September 2022, pp. 1796-1800.
    BibTeX TR2022-115 PDF Video Presentation
    • @inproceedings{Tzinis2022sep,
    • author    = {Tzinis, Efthymios and Wichern, Gordon and Subramanian, Aswin Shanmugam and Smaragdis, Paris and Le Roux, Jonathan},
    • title     = {Heterogeneous Target Speech Separation},
    • booktitle = {Interspeech},
    • pages     = {1796--1800},
    • month     = sep,
    • year      = {2022},
    • doi       = {10.21437/Interspeech.2022-10717},
    • url       = {https://www.merl.com/publications/TR2022-115},
    • }
  •  Yu, J., Wang, P., Koike-Akino, T., Wang, Y., Orlik, P.V., Buehrer, R.M., "Multi-Band Wi-Fi Sensing with Matched Feature Granularity", IEEE Internet of Things Journal, DOI: 10.1109/​JIOT.2022.3190826, July 2022.
    BibTeX TR2022-105 PDF
    • @article{Yu2022jul,
    • author  = {Yu, Jianyuan and Wang, Pu and Koike-Akino, Toshiaki and Wang, Ye and Orlik, Philip V. and Buehrer, R. Michael},
    • title   = {Multi-Band {Wi-Fi} Sensing with Matched Feature Granularity},
    • journal = {IEEE Internet of Things Journal},
    • month   = jul,
    • year    = {2022},
    • doi     = {10.1109/JIOT.2022.3190826},
    • issn    = {2327-4662},
    • url     = {https://www.merl.com/publications/TR2022-105},
    • }
  •  Shirsat, A., Sun, H., Kim, K.J., Guo, J., Nikovski, D.N., "ConvEDNet: A Convolutional Energy Disaggregation Network Using Continuous Point-On-Wave Measurements", IEEE PES General Meeting, DOI: 10.1109/​PESGM48719.2022.9916802, July 2022.
    BibTeX TR2022-101 PDF
    • @inproceedings{Shirsat2022jul,
    • author    = {Shirsat, Ashwin and Sun, Hongbo and Kim, Kyeong Jin and Guo, Jianlin and Nikovski, Daniel N.},
    • title     = {{ConvEDNet}: A Convolutional Energy Disaggregation Network Using Continuous Point-On-Wave Measurements},
    • booktitle = {2022 IEEE Power \& Energy Society General Meeting (PESGM)},
    • month     = jul,
    • year      = {2022},
    • doi       = {10.1109/PESGM48719.2022.9916802},
    • url       = {https://www.merl.com/publications/TR2022-101},
    • }
  •  Wollenstein-Betech, S., Sun, C., Zhang, J., Cassandras, C.G., Paschalidis, I.C., "Joint Data-Driven Estimation of Origin-Destination Demand and Travel Latency Functions in Multi-Class Transportation Networks", IEEE Transactions on Control of Network Systems, DOI: 10.1109/​TCNS.2022.3161200, June 2022.
    BibTeX TR2022-078 PDF
    • @article{Wollenstein-Betech2022jun,
    • author  = {Wollenstein-Betech, Salomon and Sun, Chuangchuang and Zhang, Jing and Cassandras, Christos G. and Paschalidis, Ioannis Ch.},
    • title   = {Joint Data-Driven Estimation of Origin-Destination Demand and Travel Latency Functions in Multi-Class Transportation Networks},
    • journal = {IEEE Transactions on Control of Network Systems},
    • month   = jun,
    • year    = {2022},
    • doi     = {10.1109/TCNS.2022.3161200},
    • url     = {https://www.merl.com/publications/TR2022-078},
    • }
  •  Petermann, D., Wichern, G., Wang, Z.-Q., Le Roux, J., "The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP43922.2022.9746005, April 2022, pp. 526-530.
    BibTeX TR2022-022 PDF Video Software
    • @inproceedings{Petermann2022apr,
    • author    = {Petermann, Darius and Wichern, Gordon and Wang, Zhong-Qiu and Le Roux, Jonathan},
    • title     = {The Cocktail Fork Problem: Three-Stem Audio Separation for Real-World Soundtracks},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • pages     = {526--530},
    • month     = apr,
    • year      = {2022},
    • doi       = {10.1109/ICASSP43922.2022.9746005},
    • url       = {https://www.merl.com/publications/TR2022-022},
    • }
  •  Jin, S., Pu, W., Boufounos, P.T., Orlik, P.V., Roy, S., "Automotive Radar Interference Mitigation with Fast-Time-Frequency Mode Retrieval", IEEE Radar Conference (RadarCon), DOI: 10.1109/​RadarConf2248738.2022.9764338, March 2022.
    BibTeX TR2022-029 PDF
    • @inproceedings{Jin2022mar,
    • author    = {Jin, Sian and Pu, Wang and Boufounos, Petros T. and Orlik, Philip V. and Roy, Sumit},
    • title     = {Automotive Radar Interference Mitigation with Fast-Time-Frequency Mode Retrieval},
    • booktitle = {IEEE Radar Conference (RadarCon)},
    • month     = mar,
    • year      = {2022},
    • doi       = {10.1109/RadarConf2248738.2022.9764338},
    • isbn      = {978-1-7281-5368-1},
    • url       = {https://www.merl.com/publications/TR2022-029},
    • }