- Tachioka, Y., Narita, T., Watanabe, S., "Effectiveness of Dereverberation, Feature Transformation, Discriminative Training Methods, and System Combination Approach for Various Reverberant Environments", EURASIP Journal on Advances in Signal Processing, DOI: 10.1186/s13634-015-0241-y, June 2015.
BibTeX TR2015-152 PDF- @article{Tachioka2015jun,
- author  = {Tachioka, Y. and Narita, T. and Watanabe, S.},
- title   = {Effectiveness of Dereverberation, Feature Transformation, Discriminative Training Methods, and System Combination Approach for Various Reverberant Environments},
- journal = {EURASIP Journal on Advances in Signal Processing},
- year    = {2015},
- month   = jun,
- doi     = {10.1186/s13634-015-0241-y},
- url     = {https://www.merl.com/publications/TR2015-152}
- }
- Erdogan, H., Hershey, J.R., Watanabe, S., Le Roux, J., "Phase-Sensitive and Recognition-Boosted Speech Separation Using Deep Recurrent Neural Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178061, April 2015, pp. 708-712.
BibTeX TR2015-031 PDF- @inproceedings{Erdogan2015apr,
- author    = {Erdogan, H. and Hershey, J. R. and Watanabe, S. and {Le Roux}, J.},
- title     = {Phase-Sensitive and Recognition-Boosted Speech Separation Using Deep Recurrent Neural Networks},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {708--712},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7178061},
- url       = {https://www.merl.com/publications/TR2015-031}
- }
- Kadambi, A., Boufounos, P.T., "Coded Aperture Compressive 3-D LIDAR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178153, April 2015, pp. 1166-1170.
BibTeX TR2015-028 PDF- @inproceedings{Kadambi2015apr,
- author    = {Kadambi, A. and Boufounos, P. T.},
- title     = {Coded Aperture Compressive {3-D} {LIDAR}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {1166--1170},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7178153},
- url       = {https://www.merl.com/publications/TR2015-028}
- }
- Le Roux, J., Hershey, J.R., Weninger, F.J., "Deep NMF for Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7177933, April 2015, pp. 66-70.
BibTeX TR2015-029 PDF- @inproceedings{LeRoux2015apr1,
- author    = {{Le Roux}, J. and Hershey, J. R. and Weninger, F. J.},
- title     = {Deep {NMF} for Speech Separation},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {66--70},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7177933},
- url       = {https://www.merl.com/publications/TR2015-029}
- }
- Le Roux, J., Vincent, E., Hershey, J.R., Ellis, D.P.W., "Micbots: Collecting Large Realistic Datasets for Speech and Audio Research Using Mobile Robots", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7179050, April 2015, pp. 5635-5639.
BibTeX TR2015-030 PDF- @inproceedings{LeRoux2015apr2,
- author    = {{Le Roux}, J. and Vincent, E. and Hershey, J. R. and Ellis, D. P. W.},
- title     = {Micbots: Collecting Large Realistic Datasets for Speech and Audio Research Using Mobile Robots},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {5635--5639},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7179050},
- url       = {https://www.merl.com/publications/TR2015-030}
- }
- Mansour, H., Jiang, X., "A Robust Online Subspace Estimation and Tracking Algorithm", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178735, April 2015, pp. 4065-4069.
BibTeX TR2015-027 PDF Software- @inproceedings{Mansour2015apr1,
- author    = {Mansour, H. and Jiang, X.},
- title     = {A Robust Online Subspace Estimation and Tracking Algorithm},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {4065--4069},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7178735},
- url       = {https://www.merl.com/publications/TR2015-027}
- }
- Mansour, H., Saab, R., "Weighted One-Norm Minimization with Inaccurate Support Estimates: Sharp Analysis via the Null-Space Property", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178585, April 2015, pp. 3317-3321.
BibTeX TR2015-026 PDF- @inproceedings{Mansour2015apr2,
- author    = {Mansour, H. and Saab, R.},
- title     = {Weighted One-Norm Minimization with Inaccurate Support Estimates: Sharp Analysis via the Null-Space Property},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {3317--3321},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7178585},
- url       = {https://www.merl.com/publications/TR2015-026}
- }
- Shinozaki, T., Watanabe, S., "Structure Discovery of Deep Neural Network Based on Evolutionary Algorithms", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7178918, April 2015, pp. 4979-4983.
BibTeX TR2015-032 PDF- @inproceedings{Shinozaki2015apr,
- author    = {Shinozaki, T. and Watanabe, S.},
- title     = {Structure Discovery of Deep Neural Network Based on Evolutionary Algorithms},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {4979--4983},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7178918},
- url       = {https://www.merl.com/publications/TR2015-032}
- }
- Tachioka, Y., Watanabe, S., "Discriminative Method for Recurrent Neural Network Language Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2015.7179000, April 2015, pp. 5386-5390.
BibTeX TR2015-033 PDF- @inproceedings{Tachioka2015apr,
- author    = {Tachioka, Y. and Watanabe, S.},
- title     = {Discriminative Method for Recurrent Neural Network Language Models},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2015},
- month     = apr,
- pages     = {5386--5390},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2015.7179000},
- url       = {https://www.merl.com/publications/TR2015-033}
- }
- Le Roux, J., Weninger, F.J., Hershey, J.R., "Sparse NMF -- half-baked or well done?," Tech. Rep. TR2015-023, Mitsubishi Electric Research Laboratories, March 2015.
BibTeX TR2015-023 PDF- @techreport{LeRoux2015mar,
- author      = {{Le Roux}, J. and Weninger, F. J. and Hershey, J. R.},
- title       = {Sparse {NMF} -- half-baked or well done?},
- institution = {Mitsubishi Electric Research Laboratories},
- number      = {TR2015-023},
- address     = {Cambridge MA, USA},
- year        = {2015},
- month       = mar,
- url         = {https://www.merl.com/publications/TR2015-023}
- }
- Gerkmann, T., Krawczyk, M., Le Roux, J., "Phase Processing for Single Channel Speech Enhancement: History and Recent Advances", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2014.2369251, Vol. 32, No. 2, pp. 55-66, March 2015.
BibTeX TR2014-122 PDF- @article{Gerkmann2015mar,
- author    = {Gerkmann, T. and Krawczyk, M. and {Le Roux}, J.},
- title     = {Phase Processing for Single Channel Speech Enhancement: History and Recent Advances},
- journal   = {IEEE Signal Processing Magazine},
- year      = {2015},
- month     = mar,
- volume    = {32},
- number    = {2},
- pages     = {55--66},
- publisher = {IEEE},
- doi       = {10.1109/MSP.2014.2369251},
- issn      = {1053-5888},
- url       = {https://www.merl.com/publications/TR2014-122}
- }
- Weninger, F., Le Roux, J., Hershey, J.R., Schuller, B., "Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation", IEEE Global Conference on Signal and Information Processing (GlobalSIP), DOI: 10.1109/GlobalSIP.2014.7032183, December 2014, pp. 577-581.
BibTeX TR2014-104 PDF- @inproceedings{Weninger2014dec,
- author    = {Weninger, F. and {Le Roux}, J. and Hershey, J. R. and Schuller, B.},
- title     = {Discriminatively Trained Recurrent Neural Networks for Single-Channel Speech Separation},
- booktitle = {IEEE Global Conference on Signal and Information Processing (GlobalSIP)},
- year      = {2014},
- month     = dec,
- pages     = {577--581},
- publisher = {IEEE},
- doi       = {10.1109/GlobalSIP.2014.7032183},
- url       = {https://www.merl.com/publications/TR2014-104}
- }
- Tachioka, Y., Watanabe, S., Le Roux, J., Hershey, J.R., "Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition", Interspeech, September 2014, vol. 15, pp. 2415-2419.
BibTeX TR2014-079 PDF- @inproceedings{Tachioka2014sep,
- author    = {Tachioka, Y. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R.},
- title     = {Sequential Maximum Mutual Information Linear Discriminant Analysis for Speech Recognition},
- booktitle = {Interspeech},
- year      = {2014},
- month     = sep,
- volume    = {15},
- pages     = {2415--2419},
- publisher = {International Speech Communication Association},
- issn      = {2308-457X},
- url       = {https://www.merl.com/publications/TR2014-079}
- }
- Watanabe, S., Hershey, J.R., Marks, T.K., Fujii, Y., Koji, Y., "Cost-level integration of statistical and rule-based dialog managers", Interspeech, September 2014, vol. 15, pp. 323-327.
BibTeX TR2014-082 PDF- @inproceedings{Watanabe2014sep,
- author    = {Watanabe, S. and Hershey, J. R. and Marks, T. K. and Fujii, Y. and Koji, Y.},
- title     = {Cost-level integration of statistical and rule-based dialog managers},
- booktitle = {Interspeech},
- year      = {2014},
- month     = sep,
- volume    = {15},
- pages     = {323--327},
- publisher = {International Speech Communication Association},
- issn      = {2308-457X},
- url       = {https://www.merl.com/publications/TR2014-082}
- }
- Weninger, F., Le Roux, J., Hershey, J.R., Watanabe, S., "Discriminative NMF and its application to single-channel source separation", Interspeech, September 2014, vol. 15, pp. 865-869.
BibTeX TR2014-081 PDF- @inproceedings{Weninger2014sep,
- author    = {Weninger, F. and {Le Roux}, J. and Hershey, J. R. and Watanabe, S.},
- title     = {Discriminative {NMF} and its application to single-channel source separation},
- booktitle = {Interspeech},
- year      = {2014},
- month     = sep,
- volume    = {15},
- pages     = {865--869},
- publisher = {International Speech Communication Association},
- issn      = {2308-457X},
- url       = {https://www.merl.com/publications/TR2014-081}
- }
- Le Roux, J., Vincent, E., "A Categorization of Robust Speech Processing Datasets," Tech. Rep. TR2014-116, Mitsubishi Electric Research Laboratories, September 2014.
BibTeX TR2014-116 PDF- @techreport{LeRouxVincent2014TRdatasets,
- author      = {{Le Roux}, J. and Vincent, E.},
- title       = {A Categorization of Robust Speech Processing Datasets},
- institution = {Mitsubishi Electric Research Laboratories},
- number      = {TR2014-116},
- address     = {Cambridge MA, USA},
- year        = {2014},
- month       = sep,
- note        = {v2014-09},
- url         = {https://www.merl.com/publications/TR2014-116}
- }
- Hershey, J.R., Le Roux, J., Weninger, F., "Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures", arXiv, August 2014.
BibTeX arXiv- @article{Hershey2014aug,
- author        = {Hershey, J. R. and {Le Roux}, J. and Weninger, F.},
- title         = {Deep Unfolding: Model-Based Inspiration of Novel Deep Architectures},
- journal       = {arXiv},
- year          = {2014},
- month         = aug,
- eprint        = {1409.2574},
- archivePrefix = {arXiv},
- url           = {https://arxiv.org/abs/1409.2574v1}
- }
- Tachioka, Y., Narita, T., Watanabe, S., Le Roux, J., "Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments", Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA), DOI: 10.1109/HSCMA.2014.6843272, May 2014, pp. 162-166.
BibTeX TR2014-034 PDF- @inproceedings{Tachioka2014may2,
- author    = {Tachioka, Y. and Narita, T. and Watanabe, S. and {Le Roux}, J.},
- title     = {Ensemble Integration of Calibrated Speaker Localization and Statistical Speech Detection in Domestic Environments},
- booktitle = {Joint Workshop on Hands-free Speech Communication and Microphone Arrays (HSCMA)},
- year      = {2014},
- month     = may,
- pages     = {162--166},
- publisher = {IEEE},
- doi       = {10.1109/HSCMA.2014.6843272},
- url       = {https://www.merl.com/publications/TR2014-034}
- }
- Tachioka, Y., Narita, T., Weninger, F., Watanabe, S., "Dual system combination approach for various reverberant environments with dereverberation techniques", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-032 PDF- @inproceedings{Tachioka2014may,
- author    = {Tachioka, Y. and Narita, T. and Weninger, F. and Watanabe, S.},
- title     = {Dual system combination approach for various reverberant environments with dereverberation techniques},
- booktitle = {IEEE REVERB Workshop},
- year      = {2014},
- month     = may,
- url       = {https://www.merl.com/publications/TR2014-032}
- }
- Weninger, F., Watanabe, S., Le Roux, J., Hershey, J.R., Tachioka, Y., Geiger, J., Schuller, B., Rigoll, G., "The MERL/MELCO/TUM System for the REVERB Challenge Using Deep Recurrent Neural Network Feature Enhancement", IEEE REVERB Workshop, May 2014.
BibTeX TR2014-033 PDF- @inproceedings{Weninger2014may2,
- author    = {Weninger, F. and Watanabe, S. and {Le Roux}, J. and Hershey, J. R. and Tachioka, Y. and Geiger, J. and Schuller, B. and Rigoll, G.},
- title     = {The {MERL/MELCO/TUM} System for the {REVERB} Challenge Using Deep Recurrent Neural Network Feature Enhancement},
- booktitle = {IEEE REVERB Workshop},
- year      = {2014},
- month     = may,
- url       = {https://www.merl.com/publications/TR2014-033}
- }
- Naini, R., Rane, S., Ramalingam, S., "A Vanishing Point-based Global Descriptor for Manhattan Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854423, May 2014, pp. 4349-4353.
BibTeX TR2014-029 PDF- @inproceedings{Naini2014may,
- author    = {Naini, R. and Rane, S. and Ramalingam, S.},
- title     = {A Vanishing Point-based Global Descriptor for {Manhattan} Scenes},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2014},
- month     = may,
- pages     = {4349--4353},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2014.6854423},
- url       = {https://www.merl.com/publications/TR2014-029}
- }
- Simsekli, U., Le Roux, J., Hershey, J.R., "Non-negative Source-filter Dynamical System for Speech Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854797, May 2014, pp. 6206-6210.
BibTeX TR2014-027 PDF Software- @inproceedings{Simsekli2014may,
- author    = {Simsekli, U. and {Le Roux}, J. and Hershey, J. R.},
- title     = {Non-negative Source-filter Dynamical System for Speech Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2014},
- month     = may,
- pages     = {6206--6210},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2014.6854797},
- url       = {https://www.merl.com/publications/TR2014-027}
- }
- Tang, H., Watanabe, S., Marks, T.K., Hershey, J.R., "Log-linear Dialog Manager", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854371, May 2014, pp. 4092-4096.
BibTeX TR2014-024 PDF- @inproceedings{Tang2014may,
- author    = {Tang, H. and Watanabe, S. and Marks, T. K. and Hershey, J. R.},
- title     = {Log-linear Dialog Manager},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2014},
- month     = may,
- pages     = {4092--4096},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2014.6854371},
- url       = {https://www.merl.com/publications/TR2014-024}
- }
- Wang, Y., Ortega, A., Tian, D., Vetro, A., "A Graph-based Joint Bilateral Approach for Depth Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6853724, May 2014, pp. 885-889.
BibTeX TR2014-028 PDF- @inproceedings{Wang2014may,
- author    = {Wang, Y. and Ortega, A. and Tian, D. and Vetro, A.},
- title     = {A Graph-based Joint Bilateral Approach for Depth Enhancement},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2014},
- month     = may,
- pages     = {885--889},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2014.6853724},
- url       = {https://www.merl.com/publications/TR2014-028}
- }
- Watanabe, S., Le Roux, J., "Black Box Optimization for Automatic Speech Recognition", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2014.6854202, May 2014, pp. 3256-3260.
BibTeX TR2014-021 PDF- @inproceedings{Watanabe2014may,
- author    = {Watanabe, S. and {Le Roux}, J.},
- title     = {Black Box Optimization for Automatic Speech Recognition},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year      = {2014},
- month     = may,
- pages     = {3256--3260},
- publisher = {IEEE},
- doi       = {10.1109/ICASSP.2014.6854202},
- url       = {https://www.merl.com/publications/TR2014-021}
- }