Publications

Tachioka, Y., Narita, T., Watanabe, S., "Effectiveness of Dereverberation, Feature Transformation, Discriminative Training Methods, and System Combination Approach for Various Reverberant Environments", EURASIP Journal on Advances in Signal Processing, DOI: 10.1186/s13634-015-0241-y, June 2015.
BibTeX TR2015-152 PDF
- @article{Tachioka2015jun,
- author = {Tachioka, Y. and Narita, T. and Watanabe, S.},
- title = {Effectiveness of Dereverberation, Feature Transformation, Discriminative Training Methods, and System Combination Approach for Various Reverberant Environments},
- journal = {EURASIP Journal on Advances in Signal Processing},
- year = 2015,
- month = jun,
- doi = {10.1186/s13634-015-0241-y},
- url = {https://www.merl.com/publications/TR2015-152}
- }
Erdogan, H., Hershey, J.R., Watanabe, S., Le Roux, J., "Phase-Sensitive and Recognition-Boosted Speech Separation Using Deep Recurrent Neural Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178061, April 2015, pp. 708-712.
BibTeX TR2015-031 PDF
- @inproceedings{Erdogan2015apr,
- author = {Erdogan, H. and Hershey, J.R. and Watanabe, S. and {Le Roux}, J.},
- title = {Phase-Sensitive and Recognition-Boosted Speech Separation Using Deep Recurrent Neural Networks},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {708--712},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7178061},
- url = {https://www.merl.com/publications/TR2015-031}
- }
Kadambi, A., Boufounos, P.T., "Coded Aperture Compressive 3-D LIDAR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178153, April 2015, pp. 1166-1170.
BibTeX TR2015-028 PDF
- @inproceedings{Kadambi2015apr,
- author = {Kadambi, A. and Boufounos, P.T.},
- title = {Coded Aperture Compressive 3-D LIDAR},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {1166--1170},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7178153},
- url = {https://www.merl.com/publications/TR2015-028}
- }
Le Roux, J., Hershey, J.R., Weninger, F.J., "Deep NMF for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7177933, April 2015, pp. 66-70.
BibTeX TR2015-029 PDF
- @inproceedings{LeRoux2015apr1,
- author = {{Le Roux}, J. and Hershey, J.R. and Weninger, F.J.},
- title = {Deep NMF for Speech Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {66--70},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7177933},
- url = {https://www.merl.com/publications/TR2015-029}
- }
Le Roux, J., Vincent, E., Hershey, J.R., Ellis, D.P.W., "Micbots: Collecting Large Realistic Datasets for Speech and Audio Research Using Mobile Robots", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7179050, April 2015, pp. 5635-5639.
BibTeX TR2015-030 PDF
- @inproceedings{LeRoux2015apr2,
- author = {{Le Roux}, J. and Vincent, E. and Hershey, J.R. and Ellis, D.P.W.},
- title = {Micbots: Collecting Large Realistic Datasets for Speech and Audio Research Using Mobile Robots},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {5635--5639},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7179050},
- url = {https://www.merl.com/publications/TR2015-030}
- }
Mansour, H., Jiang, X., "A Robust Online Subspace Estimation and Tracking Algorithm", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178735, April 2015, pp. 4065-4069.
BibTeX TR2015-027 PDF Software
- @inproceedings{Mansour2015apr1,
- author = {Mansour, H. and Jiang, X.},
- title = {A Robust Online Subspace Estimation and Tracking Algorithm},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {4065--4069},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7178735},
- url = {https://www.merl.com/publications/TR2015-027}
- }
Mansour, H., Saab, R., "Weighted One-Norm Minimization with Inaccurate Support Estimates: Sharp Analysis via the Null-Space Property", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178585, April 2015, pp. 3317-3321.
BibTeX TR2015-026 PDF
- @inproceedings{Mansour2015apr2,
- author = {Mansour, H. and Saab, R.},
- title = {Weighted One-Norm Minimization with Inaccurate Support Estimates: Sharp Analysis via the Null-Space Property},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {3317--3321},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7178585},
- url = {https://www.merl.com/publications/TR2015-026}
- }
Shinozaki, T., Watanabe, S., "Structure Discovery of Deep Neural Network Based on Evolutionary Algorithms", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178918, April 2015, pp. 4979-4983.
BibTeX TR2015-032 PDF
- @inproceedings{Shinozaki2015apr,
- author = {Shinozaki, T. and Watanabe, S.},
- title = {Structure Discovery of Deep Neural Network Based on Evolutionary Algorithms},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {4979--4983},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7178918},
- url = {https://www.merl.com/publications/TR2015-032}
- }
Tachioka, Y., Watanabe, S., "Discriminative Method for Recurrent Neural Network Language Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7179000, April 2015, pp. 5386-5390.
BibTeX TR2015-033 PDF
- @inproceedings{Tachioka2015apr,
- author = {Tachioka, Y. and Watanabe, S.},
- title = {Discriminative Method for Recurrent Neural Network Language Models},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2015,
- pages = {5386--5390},
- month = apr,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2015.7179000},
- url = {https://www.merl.com/publications/TR2015-033}
- }
Le Roux, J., Weninger, F.J., Hershey, J.R., "Sparse NMF -- half-baked or well done?," Tech. Rep. TR2015-023, Mitsubishi Electric Research Laboratories, March 2015.
BibTeX TR2015-023 PDF
- @techreport{LeRoux2015mar,
- author = {{Le Roux}, J. and Weninger, F.J. and Hershey, J.R.},
- title = {Sparse NMF -- half-baked or well done?},
- institution = {Mitsubishi Electric Research Laboratories},
- year = 2015,
- number = {TR2015-023},
- address = {Cambridge, MA, USA},
- month = mar,
- url = {https://www.merl.com/publications/TR2015-023}
- }
Gerkmann, T., Krawczyk, M., Le Roux, J., "Phase Processing for Single Channel Speech Enhancement: History and Recent Advances", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2014.2369251, Vol. 32, No. 2, pp. 55-66, March 2015.
BibTeX TR2014-122 PDF
- @article{Gerkmann2015mar,
- author = {Gerkmann, T. and Krawczyk, M. and {Le Roux}, J.},
- title = {Phase Processing for Single Channel Speech Enhancement: History and Recent Advances},
- journal = {IEEE Signal Processing Magazine},
- year = 2015,
- volume = 32,
- number = 2,
- pages = {55--66},
- month = mar,
- publisher = {IEEE},
- doi = {10.1109/MSP.2014.2369251},
- issn = {1053-5888},
- url = {https://www.merl.com/publications/TR2014-122}
- }
Weninger, F., Le Roux, J., Hershey, J.R., Schuller, B., "Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation", IEEE Global Conference on Signal and Information Processing (GlobalSIP), DOI: 10.1109/GlobalSIP.2014.7032183, December 2014, pp. 577-581.
BibTeX TR2014-104 PDF
- @inproceedings{Weninger2014dec,
- author = {Weninger, F. and {Le Roux}, J. and Hershey, J.R. and Schuller, B.},
- title = {Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation},
- booktitle = {IEEE Global Conference on Signal and Information Processing (GlobalSIP)},
- year = 2014,
- pages = {577--581},
- month = dec,
- publisher = {IEEE},
- doi = {10.1109/GlobalSIP.2014.7032183},
- url = {https://www.merl.com/publications/TR2014-104}
- }
Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition", Interspeech, September 2014, vol. 15, pp. 2415-2419.
BibTeX TR2014-079 PDF
- @inproceedings{Tachioka2014sep,
- author = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R.},
- title = {Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {2415--2419},
- month = sep,
- publisher = {International Speech Communication Association},
- issn = {2308-457X},
- url = {https://www.merl.com/publications/TR2014-079}
- }
Watanabe, S., Hershey, J.R., Marks, T.K., Fujii, Y., Koji, Y., "Cost-level integration of statistical and rule-based dialog managers", Interspeech, September 2014, vol. 15, pp. 323-327.
BibTeX TR2014-082 PDF
- @inproceedings{Watanabe2014sep,
- author = {Watanabe, S. and Hershey, J.R. and Marks, T.K. and Fujii, Y. and Koji, Y.},
- title = {Cost-level integration of statistical and rule-based dialog managers},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {323--327},
- month = sep,
- publisher = {International Speech Communication Association},
- issn = {2308-457X},
- url = {https://www.merl.com/publications/TR2014-082}
- }
Weninger, F., Le Roux, J., Hershey, J.R., Watanabe, S., "Discriminative NMF and its application to single-channel source separation", Interspeech, September 2014, vol. 15, pp. 865-869.
BibTeX TR2014-081 PDF
- @inproceedings{Weninger2014sep,
- author = {Weninger, F. and {Le Roux}, J. and Hershey, J.R. and Watanabe, S.},
- title = {Discriminative NMF and its application to single-channel source separation},
- booktitle = {Interspeech},
- year = 2014,
- volume = 15,
- pages = {865--869},
- month = sep,
- publisher = {International Speech Communication Association},
- issn = {2308-457X},
- url = {https://www.merl.com/publications/TR2014-081}
- }
Le Roux, J., Vincent, E., "A Categorization of Robust Speech Processing Datasets," Tech. Rep. TR2014-116, Mitsubishi Electric Research Laboratories, September 2014.
BibTeX TR2014-116 PDF
- @techreport{LeRouxVincent2014TRdatasets,
- author = {{Le Roux}, J. and Vincent, E.},
- title = {A Categorization of Robust Speech Processing Datasets},
- institution = {Mitsubishi Electric Research Laboratories},
- year = 2014,
- number = {TR2014-116},
- address = {Cambridge, MA, USA},
- month = sep,
- note = {v2014-09},
- url = {https://www.merl.com/publications/TR2014-116}
- }
Hershey, J.R., Le Roux, J., Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures", arXiv, August 2014.
BibTeX arXiv
- @article{Hershey2014aug,
- author = {Hershey, J.R. and {Le Roux}, J. and Weninger, F.},
- title = {Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures},
- journal = {arXiv},
- year = 2014,
- month = aug,
- url = {https://arxiv.org/abs/1409.2574v1}
- }
Tachioka, Y., Narita, T., Watanabe, S., Le Roux, J., "Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments", Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA), DOI: 10.1109/HSCMA.2014.6843272, May 2014, pp. 162-166.
BibTeX TR2014-034 PDF
- @inproceedings{Tachioka2014may2,
- author = {Tachioka, Y. and Narita, T. and Watanabe, S. and {Le Roux}, J.},
- title = {Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments},
- booktitle = {Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA)},
- year = 2014,
- pages = {162--166},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/HSCMA.2014.6843272},
- url = {https://www.merl.com/publications/TR2014-034}
- }
Tachioka, Y., Narita, T., Weninger, F., Watanabe, S., "Dual system combination approach for various reverberant environments with dereverberation techniques", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-032 PDF
- @inproceedings{Tachioka2014may,
- author = {Tachioka, Y. and Narita, T. and Weninger, F. and Watanabe, S.},
- title = {Dual system combination approach for various reverberant environments with dereverberation techniques},
- booktitle = {IEEE REVERB Workshop},
- year = 2014,
- month = may,
- url = {https://www.merl.com/publications/TR2014-032}
- }
Weninger, F., Watanabe, S., Le Roux, J., Hershey, J.R., Tachioka, Y., Geiger, J., Schuller, B., Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-033 PDF
- @inproceedings{Weninger2014may2,
- author = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J.R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
- title = {The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement},
- booktitle = {IEEE REVERB Workshop},
- year = 2014,
- month = may,
- url = {https://www.merl.com/publications/TR2014-033}
- }
Naini, R., Rane, S., Ramalingam, S., "A Vanishing Point-based Global Descriptor for Manhattan Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854423, May 2014, pp. 4349-4353.
BibTeX TR2014-029 PDF
- @inproceedings{Naini2014may,
- author = {Naini, R. and Rane, S. and Ramalingam, S.},
- title = {A Vanishing Point-based Global Descriptor for Manhattan Scenes},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {4349--4353},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854423},
- url = {https://www.merl.com/publications/TR2014-029}
- }
Simsekli, U., Le Roux, J., Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
BibTeX TR2014-027 PDF Software
- @inproceedings{Simsekli2014may,
- author = {Simsekli, U. and {Le Roux}, J. and Hershey, J.R.},
- title = {Non-negative Source-filter Dynamical System for Speech Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {6206--6210},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854797},
- url = {https://www.merl.com/publications/TR2014-027}
- }
Tang, H., Watanabe, S., Marks, T.K., Hershey, J.R., "Log-linear Dialog Manager", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854371, May 2014, pp. 4092-4096.
BibTeX TR2014-024 PDF
- @inproceedings{Tang2014may,
- author = {Tang, H. and Watanabe, S. and Marks, T.K. and Hershey, J.R.},
- title = {Log-linear Dialog Manager},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {4092--4096},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854371},
- url = {https://www.merl.com/publications/TR2014-024}
- }
Wang, Y., Ortega, A., Tian, D., Vetro, A., "A Graph-based Joint Bilateral Approach for Depth Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6853724, May 2014, pp. 885-889.
BibTeX TR2014-028 PDF
- @inproceedings{Wang2014may,
- author = {Wang, Y. and Ortega, A. and Tian, D. and Vetro, A.},
- title = {A Graph-based Joint Bilateral Approach for Depth Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {885--889},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6853724},
- url = {https://www.merl.com/publications/TR2014-028}
- }
Watanabe, S., Le Roux, J., "Black Box Optimization for Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854202, May 2014, pp. 3256-3260.
BibTeX TR2014-021 PDF
- @inproceedings{Watanabe2014may,
- author = {Watanabe, S. and {Le Roux}, J.},
- title = {Black Box Optimization for Automatic Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2014,
- pages = {3256--3260},
- month = may,
- publisher = {IEEE},
- doi = {10.1109/ICASSP.2014.6854202},
- url = {https://www.merl.com/publications/TR2014-021}
- }