- Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890706, April 2025.
BibTeX TR2025-037 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-037.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Ebbers2025mar,
  author    = {Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
  title     = {{No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10890706},
  url       = {https://www.merl.com/publications/TR2025-037}
}
- Gruttadauria, E., Fontaine, M., Le Roux, J., Essid, S., "O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890837, April 2025.
BibTeX TR2025-031 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-031.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Gruttadauria2025mar,
  author    = {Gruttadauria, Elio and Fontaine, Mathieu and {Le Roux}, Jonathan and Essid, Slim},
  title     = {{{O-EENC-SD}: Efficient Online End-to-End Neural Clustering for Speaker Diarization}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10890837},
  url       = {https://www.merl.com/publications/TR2025-031}
}
- Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887717, April 2025.
BibTeX TR2025-034 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-034.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Hori2025mar,
  author    = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
  title     = {{Interactive Robot Action Replanning using Multimodal {LLM} Trained from Human Demonstration Videos}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10887717},
  url       = {https://www.merl.com/publications/TR2025-034}
}
- Kitichotkul, R., Rapp, J., Ma, Y., Mansour, H., "Doppler Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888897, April 2025, pp. 1-5.
BibTeX TR2025-028 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-028.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Kitichotkul2025mar,
  author    = {Kitichotkul, Ruangrawee and Rapp, Joshua and Ma, Yanting and Mansour, Hassan},
  title     = {{Doppler Single-Photon Lidar}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  pages     = {1--5},
  month     = mar,
  publisher = {IEEE},
  doi       = {10.1109/ICASSP49660.2025.10888897},
  url       = {https://www.merl.com/publications/TR2025-028}
}
- Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889481, April 2025.
BibTeX TR2025-029 PDF Software
% ICASSP 2025 conference paper; MERL publication TR2025-029.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Masuyama2025mar,
  author    = {Masuyama, Yoshiki and Wichern, Gordon and Germain, Fran{\c{c}}ois G. and Ick, Christopher and {Le Roux}, Jonathan},
  title     = {{Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10889481},
  url       = {https://www.merl.com/publications/TR2025-029}
}
- Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888769, April 2025.
BibTeX TR2025-033 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-033.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Saijo2025mar2,
  author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
  title     = {{Leveraging Audio-Only Data for Text-Queried Target Sound Extraction}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10888769},
  url       = {https://www.merl.com/publications/TR2025-033}
}
- Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887819, April 2025.
BibTeX TR2025-032 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-032.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Saijo2025mar,
  author    = {Saijo, Kohei and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
  title     = {{Task-Aware Unified Source Separation}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10887819},
  url       = {https://www.merl.com/publications/TR2025-032}
}
- Teh, A., Ali, W.H., Rapp, J., Mansour, H., "Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889412, April 2025, pp. 1-5.
BibTeX TR2025-035 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-035.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Teh2025mar,
  author    = {Teh, Arjun and Ali, Wael H. and Rapp, Joshua and Mansour, Hassan},
  title     = {{Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  pages     = {1--5},
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10889412},
  url       = {https://www.merl.com/publications/TR2025-035}
}
- Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Keeping the Balance: Anomaly Score Calculation for Domain Generalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888402, April 2025.
BibTeX TR2025-030 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-030.
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Wilkinghoff2025mar,
  author    = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, Fran{\c{c}}ois G. and Wichern, Gordon and {Le Roux}, Jonathan},
  title     = {{Keeping the Balance: Anomaly Score Calculation for Domain Generalization}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  doi       = {10.1109/ICASSP49660.2025.10888402},
  url       = {https://www.merl.com/publications/TR2025-030}
}
- Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Multi-View Radar Detection Transformer with Differentiable Positional Encoding", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2025.
BibTeX TR2025-027 PDF
% ICASSP 2025 conference paper; MERL publication TR2025-027 (no DOI recorded in this entry).
% NOTE(review): the rendered citation lists April 2025 while month is mar; confirm which is intended.
@inproceedings{Yataka2025mar,
  author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
  title     = {{Multi-View Radar Detection Transformer with Differentiable Positional Encoding}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = 2025,
  month     = mar,
  url       = {https://www.merl.com/publications/TR2025-027}
}
- Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", arXiv, April 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Hu2025apr,
  author        = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
  title         = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
  journal       = {arXiv},
  year          = 2025,
  month         = apr,
  eprint        = {2504.03607},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.03607}
}
- Li, K., Zhang, T., Peng, K.-C., Wang, G., "PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector", arXiv, April 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Li2025apr,
  author        = {Li, Kaidong and Zhang, Tianxiao and Peng, Kuan-Chuan and Wang, Guanghui},
  title         = {{PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector}},
  journal       = {arXiv},
  year          = 2025,
  month         = apr,
  eprint        = {2504.03563},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.03563}
}
- Ghezzi, A., Nurkanović, A., Weiss, A., Diehl, M., Di Cairano, S., "A Comparative Study of MINLP and MPVC Formulations for Solving Complex Nonlinear Decision-Making Problems in Aerospace Applications", arXiv, April 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
% The accented surname is written as a BibTeX special character ({\'c}) so it survives 8-bit toolchains.
@article{Ghezzi2025apr,
  author        = {Ghezzi, Andrea and Nurkanovi{\'c}, Armin and Weiss, Avishai and Diehl, Moritz and {Di Cairano}, Stefano},
  title         = {{A Comparative Study of MINLP and MPVC Formulations for Solving Complex Nonlinear Decision-Making Problems in Aerospace Applications}},
  journal       = {arXiv},
  year          = 2025,
  month         = apr,
  eprint        = {2504.02375},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.02375}
}
- Jung, Y.G., Park, J., Yoon, J., Peng, K.-C., Kim, W., Teoh, A.B.J., Camps, O., "TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection", arXiv, April 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Jung2025apr,
  author        = {Jung, Yoon G. and Park, Jaewoo and Yoon, Jaeho and Peng, Kuan-Chuan and Kim, Wonchul and Teoh, Andrew B. J. and Camps, Octavia},
  title         = {{TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection}},
  journal       = {arXiv},
  year          = 2025,
  month         = apr,
  eprint        = {2504.02775},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.02775}
}
- Lin, C., Boufounos, P.T., Ma, Y., Wang, Y., "Time-optimal single-scalar control on a qubit of unitary dynamics", arXiv, April 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Lin2025apr,
  author        = {Lin, Chungwei and Boufounos, Petros T. and Ma, Yanting and Wang, Yebin},
  title         = {{Time-optimal single-scalar control on a qubit of unitary dynamics}},
  journal       = {arXiv},
  year          = 2025,
  month         = apr,
  eprint        = {2504.01785},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2504.01785}
}
- Chakrabarty, A., Vanfretti, L., Wang, Y., Mineyuki, T., Zhan, S., Tang, W.-T., Paulson, J.A., Deshpande, V.M., Bortoff, S.A., Laughman, C.R., "Time-Series Generative Networks for Synthesizing Realistic Scenarios in Occupant-Centric Building Simulation", Building Simulation, April 2025.
BibTeX TR2025-043 PDF
% Journal article (Building Simulation); MERL publication TR2025-043.
@article{Chakrabarty2025apr,
  author  = {Chakrabarty, Ankush and Vanfretti, Luigi and Wang, Ye and Mineyuki, Takuma and Zhan, Sicheng and Tang, Wei-Ting and Paulson, Joel A. and Deshpande, Vedang M. and Bortoff, Scott A. and Laughman, Christopher R.},
  title   = {{Time-Series Generative Networks for Synthesizing Realistic Scenarios in Occupant-Centric Building Simulation}},
  journal = {Building Simulation},
  year    = 2025,
  month   = apr,
  url     = {https://www.merl.com/publications/TR2025-043}
}
- Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Data Augmentation Using Neural Acoustic Fields With Retrieval-Augmented Pre-training", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP) Satellite Workshop on Generative Data Augmentation for Real-World Signal Processing Applications (GenDA), April 2025.
BibTeX TR2025-045 PDF
% ICASSP satellite workshop (GenDA) paper; MERL publication TR2025-045.
@inproceedings{Ick2025apr,
  author    = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, Fran{\c{c}}ois G. and {Le Roux}, Jonathan},
  title     = {{Data Augmentation Using Neural Acoustic Fields With Retrieval-Augmented Pre-training}},
  booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP) Satellite Workshop on Generative Data Augmentation for Real-World Signal Processing Applications (GenDA)},
  year      = 2025,
  month     = apr,
  url       = {https://www.merl.com/publications/TR2025-045}
}
- Smedemark-Margulies, N., Wang, Y., Koike-Akino, T., Liu, J., Parsons, K., Bicer, Y., Erdogmus, D., "Improving Subject Transfer in EEG Classification with Divergence Estimation", Journal of Neural Engineering, DOI: 10.1088/1741-2552/ad9777, Vol. 21, No. 6, April 2025.
BibTeX TR2025-044 PDF Software
% Journal article (Journal of Neural Engineering, vol. 21, no. 6); MERL publication TR2025-044.
@article{Smedemark-Margulies2025apr,
  author  = {Smedemark-Margulies, Niklas and Wang, Ye and Koike-Akino, Toshiaki and Liu, Jing and Parsons, Kieran and Bicer, Yunus and Erdogmus, Deniz},
  title   = {{Improving Subject Transfer in EEG Classification with Divergence Estimation}},
  journal = {Journal of Neural Engineering},
  year    = 2025,
  volume  = 21,
  number  = 6,
  month   = apr,
  doi     = {10.1088/1741-2552/ad9777},
  url     = {https://www.merl.com/publications/TR2025-044}
}
- Wang, J.-W., Nikovski, D.N., "Learning Visual Servoing for Nonholonomic Mobile Robots with Uncalibrated Cameras", The 40th ACM/SIGAPP Symposium On Applied Computing, March 2025.
BibTeX TR2025-042 PDF
% Conference paper (40th ACM/SIGAPP Symposium On Applied Computing); MERL publication TR2025-042.
@inproceedings{Wang2025mar2,
  author    = {Wang, Jen-Wei and Nikovski, Daniel N.},
  title     = {{Learning Visual Servoing for Nonholonomic Mobile Robots with Uncalibrated Cameras}},
  booktitle = {The 40th ACM/SIGAPP Symposium On Applied Computing},
  year      = 2025,
  month     = mar,
  url       = {https://www.merl.com/publications/TR2025-042}
}
- Dong, Y., Yagyu, E., Matsuda, T., Teo, K.H., Lin, C., Rakheja, S., "An accurate electrical and thermal co-simulation framework for modeling high-temperature DC and pulsed I-V characteristics of GaN HEMTs", IEEE Journal of the Electron Devices Society, March 2025.
BibTeX TR2025-041 PDF
% Journal article (IEEE Journal of the Electron Devices Society); MERL publication TR2025-041.
@article{Dong2025mar,
  author  = {Dong, Yicong and Yagyu, Eiji and Matsuda, Takashi and Teo, Koon Hoo and Lin, Chungwei and Rakheja, Shaloo},
  title   = {{An accurate electrical and thermal co-simulation framework for modeling high-temperature DC and pulsed I-V characteristics of GaN HEMTs}},
  journal = {IEEE Journal of the Electron Devices Society},
  year    = 2025,
  month   = mar,
  url     = {https://www.merl.com/publications/TR2025-041}
}
- Das, A., Rahman, S., Xiang, X., Palash, R.H., Hossain, T., Sikder, B., Yagyu, E., Nakamura, M., Teo, K.H., Chowdhury, N., "Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate", Advanced Theory and Simulations, March 2025.
BibTeX TR2025-040 PDF
% Journal article (Advanced Theory and Simulations); MERL publication TR2025-040.
@article{Das2025mar,
  author  = {Das, Aurick and Rahman, Saimur and Xiang, Xiaofeng and Palash, Raffd Hassan and Hossain, Toiyob and Sikder, Bejoy and Yagyu, Eiji and Nakamura, Marika and Teo, Koon Hoo and Chowdhury, Nadim},
  title   = {{Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate}},
  journal = {Advanced Theory and Simulations},
  year    = 2025,
  month   = mar,
  url     = {https://www.merl.com/publications/TR2025-040}
}
- Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
BibTeX TR2025-039 PDF Presentation
% Conference paper (International Conference on 3D Vision); MERL publication TR2025-039.
% The author list is delimited by a single brace pair so BibTeX splits it on "and";
% extra enclosing braces would turn all six people into one literal name.
@inproceedings{Ranade2025mar,
  author    = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
  title     = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
  booktitle = {International Conference on 3D Vision (3DV)},
  year      = 2025,
  month     = mar,
  url       = {https://www.merl.com/publications/TR2025-039}
}
- Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", arXiv, March 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Shenoy2025mar,
  author        = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
  title         = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
  journal       = {arXiv},
  year          = 2025,
  month         = mar,
  eprint        = {2503.17269},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2503.17269}
}
- Shenoy, V., Wu, S., Comas, A., Marks, T.K., Lohit, S., Mansour, H., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", arXiv, March 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Shenoy2025mar2,
  author        = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Marks, Tim K. and Lohit, Suhas and Mansour, Hassan},
  title         = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
  journal       = {arXiv},
  year          = 2025,
  month         = mar,
  eprint        = {2503.17351},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2503.17351}
}
- Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", arXiv, March 2025.
BibTeX arXiv
% arXiv preprint; eprint/archiveprefix carry the identifier from the URL for eprint-aware styles.
@article{Wilkinghoff2025mar2,
  author        = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
  title         = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
  journal       = {arXiv},
  year          = 2025,
  month         = mar,
  eprint        = {2503.10435},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2503.10435}
}