Publications

Hsieh, J.-W., Wu, Y.-H., Hsieh, Y.-K., Li, X., Peng, K.-C., Chang, M.-C., "SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification", CVPR Findings, June 2026.
BibTeX TR2026-075 PDF
- @inproceedings{Hsieh2026jun2,
- author = {Hsieh, Jun-Wei and Wu, Ying-Hsuan and Hsieh, Yi-Kuan and Li, Xin and Peng, Kuan-Chuan and Chang, Ming-Ching},
- title = {{SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification}},
- booktitle = {CVPR Findings},
- year = 2026,
- month = jun,
- url = {https://www.merl.com/publications/TR2026-075}
- }
Richter, J., Masuyama, Y., Boeddeker, C., Edo, T., Wichern, G., Le Roux, J., "Predictive-Generative Drift Decomposition for Speech Enhancement and Separation", arXiv, May 2026.
BibTeX arXiv
- @article{Richter2026may,
- author = {Richter, Julius and Masuyama, Yoshiki and Boeddeker, Christoph and Edo, Takahiro and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Predictive-Generative Drift Decomposition for Speech Enhancement and Separation}},
- journal = {arXiv},
- year = 2026,
- month = may,
- url = {https://arxiv.org/abs/2605.06189}
- }
Aihara, R., Masuyama, Y., Paissan, F., Germain, F.G., Wichern, G., Le Roux, J., "SUNAC: Source-aware Unified Neural Audio Codec", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2026.
BibTeX TR2026-032 PDF
- @inproceedings{Aihara2026may,
- author = {Aihara, Ryo and Masuyama, Yoshiki and Paissan, Francesco and Germain, François G and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{SUNAC: Source-aware Unified Neural Audio Codec}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2026,
- month = may,
- url = {https://www.merl.com/publications/TR2026-032}
- }
Masuyama, Y., Saijo, K., Paissan, F., Han, J., Delcroix, M., Aihara, R., Germain, F.G., Wichern, G., Le Roux, J., "FlexIO: Flexible Single- and Multi-Channel Speech Separation and Enhancement", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), May 2026.
BibTeX TR2026-034 PDF
- @inproceedings{Masuyama2026may2,
- author = {Masuyama, Yoshiki and Saijo, Kohei and Paissan, Francesco and Han, Jiangyu and Delcroix, Marc and Aihara, Ryo and Germain, François G and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{FlexIO: Flexible Single- and Multi-Channel Speech Separation and Enhancement}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2026,
- month = may,
- url = {https://www.merl.com/publications/TR2026-034}
- }
Jeon, C.-B., Wichern, G., Germain, F.G., Le Roux, J., "Embracing Cacophony: Explaining and Improving Random Mixing in Music Source Separation", IEEE Open Journal of Signal Processing, DOI: 10.1109/OJSP.2025.3633567, Vol. 6, pp. 1179-1192, January 2026.
BibTeX TR2026-012 PDF Software
- @article{Jeon2026jan,
- author = {Jeon, Chang-Bin and Wichern, Gordon and Germain, François G and {Le Roux}, Jonathan},
- title = {{Embracing Cacophony: Explaining and Improving Random Mixing in Music Source Separation}},
- journal = {IEEE Open Journal of Signal Processing},
- year = 2026,
- volume = 6,
- pages = {1179--1192},
- month = jan,
- doi = {10.1109/OJSP.2025.3633567},
- url = {https://www.merl.com/publications/TR2026-012}
- }
Cornell, S., Boeddeker, C., Park, T., Huang, H., Raj, D., Wiesner, M., Masuyama, Y., Chang, X., Wang, Z.-Q., Squartini, S., Garcia, P., Watanabe, S., "Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges", Computer Speech & Language, DOI: 10.1016/j.csl.2025.101901, Vol. 97, pp. 101901, December 2025.
BibTeX TR2026-008 PDF
- @article{Cornell2025dec,
- author = {Cornell, Samuele and Boeddeker, Christoph and Park, Taejin and Huang, He and Raj, Desh and Wiesner, Matthew and Masuyama, Yoshiki and Chang, Xuankai and Wang, Zhong-Qiu and Squartini, Stefano and Garcia, Paola and Watanabe, Shinji},
- title = {{Recent Trends in Distant Conversational Speech Recognition: A Review of CHiME-7 and 8 DASR Challenges}},
- journal = {Computer Speech \& Language},
- year = 2025,
- volume = 97,
- pages = 101901,
- month = dec,
- doi = {10.1016/j.csl.2025.101901},
- url = {https://www.merl.com/publications/TR2026-008}
- }
Sun, H., Otake, Y., Matsuyama, K., Raghunathan, A., "Switchgear Partial Discharge Diagnosis Using Scarce Fault Records", IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe), DOI: 10.1109/ISGTEurope64741.2025.11305301, October 2025.
BibTeX TR2025-155 PDF
- @inproceedings{Sun2025oct,
- author = {Sun, Hongbo and Otake, Yasutomo and Matsuyama, Kotaro and Raghunathan, Arvind},
- title = {{Switchgear Partial Discharge Diagnosis Using Scarce Fault Records}},
- booktitle = {IEEE PES Innovative Smart Grid Technologies Conference - Europe (ISGT Europe)},
- year = 2025,
- month = oct,
- doi = {10.1109/ISGTEurope64741.2025.11305301},
- url = {https://www.merl.com/publications/TR2025-155}
- }
Vats, S., Jha, D.K., Likhachev, M., Kroemer, O., Romeres, D., "RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), DOI: 10.1109/IROS60139.2025.11245856, October 2025.
BibTeX TR2025-152 PDF Video
- @inproceedings{Vats2025oct,
- author = {Vats, Shivam and Jha, Devesh K. and Likhachev, Maxim and Kroemer, Oliver and Romeres, Diego},
- title = {{RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation}},
- booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
- year = 2025,
- month = oct,
- publisher = {IEEE},
- doi = {10.1109/IROS60139.2025.11245856},
- issn = {2153-0866},
- isbn = {979-8-3315-4393-8},
- url = {https://www.merl.com/publications/TR2025-152}
- }
Paissan, F., Wichern, G., Masuyama, Y., Aihara, R., Germain, F.G., Saijo, K., Le Roux, J., "FasTUSS: Faster Task-Aware Unified Source Separation", IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), DOI: 10.1109/WASPAA66052.2025.11230943, October 2025.
BibTeX TR2025-143 PDF
- @inproceedings{Paissan2025oct,
- author = {Paissan, Francesco and Wichern, Gordon and Masuyama, Yoshiki and Aihara, Ryo and Germain, François G and Saijo, Kohei and {Le Roux}, Jonathan},
- title = {{FasTUSS: Faster Task-Aware Unified Source Separation}},
- booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)},
- year = 2025,
- month = oct,
- doi = {10.1109/WASPAA66052.2025.11230943},
- url = {https://www.merl.com/publications/TR2025-143}
- }
Steinmetz, C., Uhle, C., Everardo, F., Mitcheltree, C., McElveen, J.K., Jot, J.-M., Wichern, G., "Audio Signal Processing in the Artificial Intelligence Era: Challenges and Directions", Journal of the Audio Engineering Society, DOI: 10.17743/jaes.2022.0209, Vol. 73, No. 7/8, pp. 406-428, August 2025.
BibTeX TR2025-116 PDF
- @article{Steinmetz2025aug,
- author = {Steinmetz, Christian and Uhle, Christian and Everardo, Flavio and Mitcheltree, Christopher and McElveen, J. Keith and Jot, Jean-Marc and Wichern, Gordon},
- title = {{Audio Signal Processing in the Artificial Intelligence Era: Challenges and Directions}},
- journal = {Journal of the Audio Engineering Society},
- year = 2025,
- volume = 73,
- number = {7/8},
- pages = {406--428},
- month = aug,
- doi = {10.17743/jaes.2022.0209},
- url = {https://www.merl.com/publications/TR2025-116}
- }
Pavlasek, N., Di Cairano, S., Weiss, A., "Geostationary Satellite Station Keeping and Collocation under High-Thrust Impulsive Control", American Control Conference (ACC), DOI: 10.23919/ACC63710.2025.11107882, July 2025, pp. 4947-4953.
BibTeX TR2025-101 PDF
- @inproceedings{Pavlasek2025jul,
- author = {Pavlasek, Natalia and {Di Cairano}, Stefano and Weiss, Avishai},
- title = {{Geostationary Satellite Station Keeping and Collocation under High-Thrust Impulsive Control}},
- booktitle = {American Control Conference (ACC)},
- year = 2025,
- pages = {4947--4953},
- month = jul,
- publisher = {IEEE},
- doi = {10.23919/ACC63710.2025.11107882},
- issn = {2378-5861},
- isbn = {979-8-3315-6937-2},
- url = {https://www.merl.com/publications/TR2025-101}
- }
Dai, M., Lu, Z., Li, N., Wang, Y., "Enhanced Agility and Safety in Mobile Manipulators through Centroidal Momentum-Based Motion Planning", European Control Conference (ECC), DOI: 10.23919/ECC65951.2025.11186833, June 2025.
BibTeX TR2025-092 PDF
- @inproceedings{Dai2025jun,
- author = {Dai, Min and Lu, Zehui and Li, Na and Wang, Yebin},
- title = {{Enhanced Agility and Safety in Mobile Manipulators through Centroidal Momentum-Based Motion Planning}},
- booktitle = {European Control Conference (ECC)},
- year = 2025,
- month = jun,
- doi = {10.23919/ECC65951.2025.11186833},
- url = {https://www.merl.com/publications/TR2025-092}
- }
Masuyama, Y., "Single- and Multi-Channel Speech Enhancement and Separation for Far-Field Conversation Recognition," Tech. Rep. TR2025-097, Jelinek Summer Workshop on Speech and Language Technology (JSALT), June 2025.
BibTeX TR2025-097 PDF
- @techreport{Masuyama2025jun,
- author = {Masuyama, Yoshiki},
- title = {{Single- and Multi-Channel Speech Enhancement and Separation for Far-Field Conversation Recognition}},
- institution = {Jelinek Summer Workshop on Speech and Language Technology (JSALT)},
- number = {TR2025-097},
- year = 2025,
- month = jun,
- url = {https://www.merl.com/publications/TR2025-097}
- }
Vats, S., Jha, D.K., Likhachev, M., Kroemer, O., Romeres, D., "RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation", R3: Reasoning for Robust Robot Manipulation in the Open World Workshop at R:SS 2025, June 2025.
BibTeX TR2025-091 PDF Video
- @inproceedings{Vats2025jun,
- author = {Vats, Shivam and Jha, Devesh K. and Likhachev, Maxim and Kroemer, Oliver and Romeres, Diego},
- title = {{RecoveryChaining: Learning Local Recovery Policies for Robust Manipulation}},
- booktitle = {R3: Reasoning for Robust Robot Manipulation in the Open World Workshop at R:SS 2025},
- year = 2025,
- month = jun,
- url = {https://www.merl.com/publications/TR2025-091}
- }
Jung, Y.G., Park, J., Yoon, J., Peng, K.-C., Kim, W., Teoh, A.B.J., Camps, O., "TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S., Eds., DOI: 10.1109/CVPR52734.2025.02378, June 2025, pp. 25539-25548.
BibTeX TR2025-077 PDF Video Presentation
- @inproceedings{Jung2025jun,
- author = {Jung, Yoon G. and Park, Jaewoo and Yoon, Jaeho and Peng, Kuan-Chuan and Kim, Wonchul and Teoh, Andrew B. J. and Camps, Octavia},
- title = {{TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
- year = 2025,
- editor = {Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S.},
- pages = {25539--25548},
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/CVPR52734.2025.02378},
- issn = {2575-7075},
- isbn = {979-8-3315-4364-8},
- url = {https://www.merl.com/publications/TR2025-077}
- }
Masuyama, Y., Chang, X., Zhang, W., Cornell, S., Wang, Z.-Q., Ono, N., Qian, Y., Watanabe, S., "An End-to-End Integration of Speech Separation and Recognition with Self-Supervised Learning Representation", Computer Speech & Language, DOI: 10.1016/j.csl.2025.101813, Vol. 95, pp. 101813, May 2025.
BibTeX TR2025-054 PDF
- @article{Masuyama2025may,
- author = {Masuyama, Yoshiki and Chang, Xuankai and Zhang, Wangyou and Cornell, Samuele and Wang, Zhong-Qiu and Ono, Nobutaka and Qian, Yanmin and Watanabe, Shinji},
- title = {{An End-to-End Integration of Speech Separation and Recognition with Self-Supervised Learning Representation}},
- journal = {Computer Speech \& Language},
- year = 2025,
- volume = 95,
- pages = 101813,
- month = may,
- doi = {10.1016/j.csl.2025.101813},
- issn = {0885-2308},
- url = {https://www.merl.com/publications/TR2025-054}
- }
Araki, S., Ito, N., Haeb-Umbach, R., Wichern, G., Wang, Z.-Q., Mitsufuji, Y., "30+ Years of Source Separation Research: Achievements and Future Challenges", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889006, April 2025, pp. 1-5.
BibTeX TR2025-036 PDF
- @inproceedings{Araki2025mar,
- author = {Araki, Shoko and Ito, Nobutaka and Haeb-Umbach, Reinhold and Wichern, Gordon and Wang, Zhong-Qiu and Mitsufuji, Yuki},
- title = {{30+ Years of Source Separation Research: Achievements and Future Challenges}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2025,
- pages = {1--5},
- month = apr,
- doi = {10.1109/ICASSP49660.2025.10889006},
- url = {https://www.merl.com/publications/TR2025-036}
- }
Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887819, April 2025.
BibTeX TR2025-032 PDF Software
- @inproceedings{Saijo2025mar,
- author = {Saijo, Kohei and Ebbers, Janek and Germain, François G and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Task-Aware Unified Source Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2025,
- month = apr,
- doi = {10.1109/ICASSP49660.2025.10887819},
- url = {https://www.merl.com/publications/TR2025-032}
- }
Kato, S., Wang, P., Koike-Akino, T., Fujihashi, T., Mansour, H., Boufounos, P.T., "Multi-Band Wi-Fi Neural Dynamic Fusion", IEEE Transactions on Wireless Communications, DOI: 10.1109/TWC.2025.3538463, Vol. 24, No. 5, pp. 3698-3714, February 2025.
BibTeX TR2025-115 PDF
- @article{Kato2025jul,
- author = {Kato, Sorachi and Wang, Pu and Koike-Akino, Toshiaki and Fujihashi, Takuya and Mansour, Hassan and Boufounos, Petros T.},
- title = {{Multi-Band Wi-Fi Neural Dynamic Fusion}},
- journal = {IEEE Transactions on Wireless Communications},
- year = 2025,
- volume = 24,
- number = 5,
- pages = {3698--3714},
- month = jul,
- doi = {10.1109/TWC.2025.3538463},
- issn = {1558-2248},
- url = {https://www.merl.com/publications/TR2025-115}
- }
Vinod, A.P., Weiss, A., Di Cairano, S., "Inscribing and separating an ellipsoid and a constrained zonotope: Applications in stochastic control and centering", IEEE Conference on Decision and Control (CDC), DOI: 10.1109/CDC56724.2024.10886451, December 2024, pp. 8125-8131.
BibTeX TR2024-173 PDF
- @inproceedings{Vinod2024dec,
- author = {Vinod, Abraham P. and Weiss, Avishai and {Di Cairano}, Stefano},
- title = {{Inscribing and separating an ellipsoid and a constrained zonotope: Applications in stochastic control and centering}},
- booktitle = {IEEE Conference on Decision and Control (CDC)},
- year = 2024,
- pages = {8125--8131},
- month = dec,
- doi = {10.1109/CDC56724.2024.10886451},
- url = {https://www.merl.com/publications/TR2024-173}
- }
Cornell, S., Ebbers, J., Douwes, C., Martin-Morato, I., Harju, M., Mesaros, A., Serizel, R., "DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels", Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop, October 2024, pp. 31-35.
BibTeX TR2024-146 PDF
- @inproceedings{Cornell2024oct,
- author = {Cornell, Samuele and Ebbers, Janek and Douwes, Constance and Martin-Morato, Irene and Harju, Manu and Mesaros, Annamaria and Serizel, Romain},
- title = {{DCASE 2024 Task 4: Sound Event Detection with Heterogeneous Data and Missing Labels}},
- booktitle = {Detection and Classification of Acoustic Scenes and Events (DCASE) Workshop},
- year = 2024,
- pages = {31--35},
- month = oct,
- url = {https://www.merl.com/publications/TR2024-146}
- }
Saijo, K., Wichern, G., Germain, F.G., Pan, Z., Le Roux, J., "TF-Locoformer: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/IWAENC61483.2024.10694313, September 2024, pp. 205-209.
BibTeX TR2024-126 PDF Software
- @inproceedings{Saijo2024sep2,
- author = {Saijo, Kohei and Wichern, Gordon and Germain, François G and Pan, Zexu and {Le Roux}, Jonathan},
- title = {{TF-Locoformer: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement}},
- booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
- year = 2024,
- pages = {205--209},
- month = sep,
- doi = {10.1109/IWAENC61483.2024.10694313},
- issn = {2835-3439},
- isbn = {979-8-3503-6185-8},
- url = {https://www.merl.com/publications/TR2024-126}
- }
Pan, Z., Wichern, G., Germain, F.G., Saijo, K., Le Roux, J., "PARIS: Pseudo-AutoRegressIve Siamese Training for Online Speech Separation", Interspeech, DOI: 10.21437/Interspeech.2024-1066, September 2024, pp. 582-586.
BibTeX TR2024-124 PDF
- @inproceedings{Pan2024sep,
- author = {Pan, Zexu and Wichern, Gordon and Germain, François G and Saijo, Kohei and {Le Roux}, Jonathan},
- title = {{PARIS: Pseudo-AutoRegressIve Siamese Training for Online Speech Separation}},
- booktitle = {Interspeech},
- year = 2024,
- pages = {582--586},
- month = sep,
- doi = {10.21437/Interspeech.2024-1066},
- issn = {2958-1796},
- url = {https://www.merl.com/publications/TR2024-124}
- }
Saijo, K., Wichern, G., Germain, F.G., Pan, Z., Le Roux, J., "Enhanced Reverberation as Supervision for Unsupervised Speech Separation", Interspeech, DOI: 10.21437/Interspeech.2024-1241, September 2024, pp. 607-611.
BibTeX TR2024-116 PDF Software
- @inproceedings{Saijo2024sep,
- author = {Saijo, Kohei and Wichern, Gordon and Germain, François G and Pan, Zexu and {Le Roux}, Jonathan},
- title = {{Enhanced Reverberation as Supervision for Unsupervised Speech Separation}},
- booktitle = {Interspeech},
- year = 2024,
- pages = {607--611},
- month = sep,
- doi = {10.21437/Interspeech.2024-1241},
- issn = {2958-1796},
- url = {https://www.merl.com/publications/TR2024-116}
- }
Vinod, A.P., Yamazaki, S., Chakrabarty, A., Yoshikawa, N., Di Cairano, S., "Aircraft Approach Management using Reachability and Dynamic Programming", American Control Conference (ACC), DOI: 10.23919/ACC60939.2024.10644902, June 2024, pp. 318-324.
BibTeX TR2024-079 PDF
- @inproceedings{Vinod2024jun,
- author = {Vinod, Abraham P. and Yamazaki, Sachiyo and Chakrabarty, Ankush and Yoshikawa, Nobuyuki and {Di Cairano}, Stefano},
- title = {{Aircraft Approach Management using Reachability and Dynamic Programming}},
- booktitle = {American Control Conference (ACC)},
- year = 2024,
- pages = {318--324},
- month = jun,
- publisher = {IEEE},
- doi = {10.23919/ACC60939.2024.10644902},
- url = {https://www.merl.com/publications/TR2024-079}
- }